Skip to content

Type Alias: GgufMetadataTokenizer

ts
/**
 * Tokenizer-related GGUF metadata.
 *
 * All members are read-only. Only `ggml`, `ggml.model`, `ggml.tokens` and
 * `ggml.token_type` are required; every other member may be absent.
 */
type GgufMetadataTokenizer = {
  readonly ggml: {
    /** Known values are listed for reference; `| string` admits any other value. */
    readonly model: "no_vocab" | "llama" | "gpt2" | "bert" | string;
    /** Known values are listed for reference; `| string` admits any other value. */
    readonly pre?:
      | "default"
      | "llama3"
      | "llama-v3"
      | "llama-bpe"
      | "deepseek-llm"
      | "deepseek-coder"
      | "falcon"
      | "falcon3"
      | "mpt"
      | "starcoder"
      | "gpt-2"
      | "phi-2"
      | "jina-es"
      | "jina-de"
      | "jina-v1-en"
      | "jina-v2-es"
      | "jina-v2-de"
      | "jina-v2-code"
      | "refact"
      | "command-r"
      | "qwen2"
      | "stablelm2"
      | "olmo"
      | "dbrx"
      | "smaug-bpe"
      | "poro-chat"
      | "chatglm-bpe"
      | "viking"
      | "jais"
      | "tekken"
      | "smollm"
      | "codeshell"
      | "bloom"
      | "gpt3-finnish"
      | "exaone"
      | "chameleon"
      | "minerva-7b"
      | string;
    readonly tokens: readonly string[];
    readonly token_type: GgufMetadataTokenizerTokenType[];
    readonly token_type_count?: number;
    readonly scores?: readonly number[];
    readonly merges?: readonly string[];
    readonly bos_token_id?: number;
    readonly eos_token_id?: number;
    readonly eot_token_id?: number;
    readonly eom_token_id?: number;
    readonly unknown_token_id?: number;
    readonly separator_token_id?: number;
    readonly padding_token_id?: number;
    readonly cls_token_id?: number;
    readonly mask_token_id?: number;
    readonly add_bos_token?: boolean;
    readonly add_eos_token?: boolean;
    readonly add_space_prefix?: boolean;
    readonly added_tokens?: readonly string[];
    readonly fim_pre_token_id?: number;
    readonly fim_suf_token_id?: number;
    readonly fim_mid_token_id?: number;
    readonly fim_pad_token_id?: number;
    readonly fim_rep_token_id?: number;
    readonly fim_sep_token_id?: number;
    /** @deprecated */
    readonly prefix_token_id?: number;
    /** @deprecated */
    readonly suffix_token_id?: number;
    /** @deprecated */
    readonly middle_token_id?: number;
  };
  readonly huggingface?: {
    readonly json?: string;
  };
  readonly chat_template?: string;
};

Defined in: gguf/types/GgufMetadataTypes.ts:224

Type declaration

ggml

ts
readonly ggml: {
  /** Known values are listed for reference; `| string` admits any other value. */
  readonly model: "no_vocab" | "llama" | "gpt2" | "bert" | string;
  /** Known values are listed for reference; `| string` admits any other value. */
  readonly pre?:
    | "default"
    | "llama3"
    | "llama-v3"
    | "llama-bpe"
    | "deepseek-llm"
    | "deepseek-coder"
    | "falcon"
    | "falcon3"
    | "mpt"
    | "starcoder"
    | "gpt-2"
    | "phi-2"
    | "jina-es"
    | "jina-de"
    | "jina-v1-en"
    | "jina-v2-es"
    | "jina-v2-de"
    | "jina-v2-code"
    | "refact"
    | "command-r"
    | "qwen2"
    | "stablelm2"
    | "olmo"
    | "dbrx"
    | "smaug-bpe"
    | "poro-chat"
    | "chatglm-bpe"
    | "viking"
    | "jais"
    | "tekken"
    | "smollm"
    | "codeshell"
    | "bloom"
    | "gpt3-finnish"
    | "exaone"
    | "chameleon"
    | "minerva-7b"
    | string;
  readonly tokens: readonly string[];
  readonly token_type: GgufMetadataTokenizerTokenType[];
  readonly token_type_count?: number;
  readonly scores?: readonly number[];
  readonly merges?: readonly string[];
  readonly bos_token_id?: number;
  readonly eos_token_id?: number;
  readonly eot_token_id?: number;
  readonly eom_token_id?: number;
  readonly unknown_token_id?: number;
  readonly separator_token_id?: number;
  readonly padding_token_id?: number;
  readonly cls_token_id?: number;
  readonly mask_token_id?: number;
  readonly add_bos_token?: boolean;
  readonly add_eos_token?: boolean;
  readonly add_space_prefix?: boolean;
  readonly added_tokens?: readonly string[];
  readonly fim_pre_token_id?: number;
  readonly fim_suf_token_id?: number;
  readonly fim_mid_token_id?: number;
  readonly fim_pad_token_id?: number;
  readonly fim_rep_token_id?: number;
  readonly fim_sep_token_id?: number;
  /** @deprecated */
  readonly prefix_token_id?: number;
  /** @deprecated */
  readonly suffix_token_id?: number;
  /** @deprecated */
  readonly middle_token_id?: number;
};

ggml.model

ts
readonly model: "no_vocab" | "llama" | "gpt2" | "bert" | string;

ggml.pre?

ts
readonly optional pre: 
  | "default"
  | "llama3"
  | "llama-v3"
  | "llama-bpe"
  | "deepseek-llm"
  | "deepseek-coder"
  | "falcon"
  | "falcon3"
  | "mpt"
  | "starcoder"
  | "gpt-2"
  | "phi-2"
  | "jina-es"
  | "jina-de"
  | "jina-v1-en"
  | "jina-v2-es"
  | "jina-v2-de"
  | "jina-v2-code"
  | "refact"
  | "command-r"
  | "qwen2"
  | "stablelm2"
  | "olmo"
  | "dbrx"
  | "smaug-bpe"
  | "poro-chat"
  | "chatglm-bpe"
  | "viking"
  | "jais"
  | "tekken"
  | "smollm"
  | "codeshell"
  | "bloom"
  | "gpt3-finnish"
  | "exaone"
  | "chameleon"
  | "minerva-7b"
  | string;

ggml.tokens

ts
readonly tokens: readonly string[];

ggml.token_type

ts
readonly token_type: GgufMetadataTokenizerTokenType[];

ggml.token_type_count?

ts
readonly optional token_type_count: number;

ggml.scores?

ts
readonly optional scores: readonly number[];

ggml.merges?

ts
readonly optional merges: readonly string[];

ggml.bos_token_id?

ts
readonly optional bos_token_id: number;

ggml.eos_token_id?

ts
readonly optional eos_token_id: number;

ggml.eot_token_id?

ts
readonly optional eot_token_id: number;

ggml.eom_token_id?

ts
readonly optional eom_token_id: number;

ggml.unknown_token_id?

ts
readonly optional unknown_token_id: number;

ggml.separator_token_id?

ts
readonly optional separator_token_id: number;

ggml.padding_token_id?

ts
readonly optional padding_token_id: number;

ggml.cls_token_id?

ts
readonly optional cls_token_id: number;

ggml.mask_token_id?

ts
readonly optional mask_token_id: number;

ggml.add_bos_token?

ts
readonly optional add_bos_token: boolean;

ggml.add_eos_token?

ts
readonly optional add_eos_token: boolean;

ggml.add_space_prefix?

ts
readonly optional add_space_prefix: boolean;

ggml.added_tokens?

ts
readonly optional added_tokens: readonly string[];

ggml.fim_pre_token_id?

ts
readonly optional fim_pre_token_id: number;

ggml.fim_suf_token_id?

ts
readonly optional fim_suf_token_id: number;

ggml.fim_mid_token_id?

ts
readonly optional fim_mid_token_id: number;

ggml.fim_pad_token_id?

ts
readonly optional fim_pad_token_id: number;

ggml.fim_rep_token_id?

ts
readonly optional fim_rep_token_id: number;

ggml.fim_sep_token_id?

ts
readonly optional fim_sep_token_id: number;

ggml.prefix_token_id?

ts
readonly optional prefix_token_id: number;
Deprecated

ggml.suffix_token_id?

ts
readonly optional suffix_token_id: number;
Deprecated

ggml.middle_token_id?

ts
readonly optional middle_token_id: number;
Deprecated

huggingface?

ts
readonly optional huggingface: {
  readonly json?: string;
};

huggingface.json?

ts
readonly optional json: string;

chat_template?

ts
readonly optional chat_template: string;