Type Alias: GgufMetadataTokenizer
ts
/**
 * Tokenizer metadata type (declared in `gguf/types/GgufMetadataTypes.ts`).
 *
 * Every member is `readonly`. Only `ggml` and, inside it, `model`, `tokens`
 * and `token_type` are required; all other members are optional and must be
 * checked for `undefined` before use.
 */
type GgufMetadataTokenizer = {
    readonly ggml: {
        /** Known values are listed for editor hints; any other string is accepted. */
        readonly model: "no_vocab" | "llama" | "gpt2" | "bert" | string;
        /** Known values are listed for editor hints; any other string is accepted. */
        readonly pre?:
            | "default"
            | "llama3"
            | "llama-v3"
            | "llama-bpe"
            | "deepseek-llm"
            | "deepseek-coder"
            | "falcon"
            | "falcon3"
            | "mpt"
            | "starcoder"
            | "gpt-2"
            | "phi-2"
            | "jina-es"
            | "jina-de"
            | "jina-v1-en"
            | "jina-v2-es"
            | "jina-v2-de"
            | "jina-v2-code"
            | "refact"
            | "command-r"
            | "qwen2"
            | "stablelm2"
            | "olmo"
            | "dbrx"
            | "smaug-bpe"
            | "poro-chat"
            | "chatglm-bpe"
            | "viking"
            | "jais"
            | "tekken"
            | "smollm"
            | "codeshell"
            | "bloom"
            | "gpt3-finnish"
            | "exaone"
            | "chameleon"
            | "minerva-7b"
            | string;
        readonly tokens: readonly string[];
        readonly token_type: GgufMetadataTokenizerTokenType[];
        readonly token_type_count?: number;
        readonly scores?: readonly number[];
        readonly merges?: readonly string[];
        readonly bos_token_id?: number;
        readonly eos_token_id?: number;
        readonly eot_token_id?: number;
        readonly eom_token_id?: number;
        readonly unknown_token_id?: number;
        readonly separator_token_id?: number;
        readonly padding_token_id?: number;
        readonly cls_token_id?: number;
        readonly mask_token_id?: number;
        readonly add_bos_token?: boolean;
        readonly add_eos_token?: boolean;
        readonly add_space_prefix?: boolean;
        readonly added_tokens?: readonly string[];
        readonly fim_pre_token_id?: number;
        readonly fim_suf_token_id?: number;
        readonly fim_mid_token_id?: number;
        readonly fim_pad_token_id?: number;
        readonly fim_rep_token_id?: number;
        readonly fim_sep_token_id?: number;
        /** @deprecated */
        readonly prefix_token_id?: number;
        /** @deprecated */
        readonly suffix_token_id?: number;
        /** @deprecated */
        readonly middle_token_id?: number;
    };
    readonly huggingface?: {
        readonly json?: string;
    };
    readonly chat_template?: string;
};
Defined in: gguf/types/GgufMetadataTypes.ts:224
Type declaration
ggml
ts
readonly ggml: {
    readonly model: "no_vocab" | "llama" | "gpt2" | "bert" | string;
    readonly pre?:
        | "default"
        | "llama3"
        | "llama-v3"
        | "llama-bpe"
        | "deepseek-llm"
        | "deepseek-coder"
        | "falcon"
        | "falcon3"
        | "mpt"
        | "starcoder"
        | "gpt-2"
        | "phi-2"
        | "jina-es"
        | "jina-de"
        | "jina-v1-en"
        | "jina-v2-es"
        | "jina-v2-de"
        | "jina-v2-code"
        | "refact"
        | "command-r"
        | "qwen2"
        | "stablelm2"
        | "olmo"
        | "dbrx"
        | "smaug-bpe"
        | "poro-chat"
        | "chatglm-bpe"
        | "viking"
        | "jais"
        | "tekken"
        | "smollm"
        | "codeshell"
        | "bloom"
        | "gpt3-finnish"
        | "exaone"
        | "chameleon"
        | "minerva-7b"
        | string;
    readonly tokens: readonly string[];
    readonly token_type: GgufMetadataTokenizerTokenType[];
    readonly token_type_count?: number;
    readonly scores?: readonly number[];
    readonly merges?: readonly string[];
    readonly bos_token_id?: number;
    readonly eos_token_id?: number;
    readonly eot_token_id?: number;
    readonly eom_token_id?: number;
    readonly unknown_token_id?: number;
    readonly separator_token_id?: number;
    readonly padding_token_id?: number;
    readonly cls_token_id?: number;
    readonly mask_token_id?: number;
    readonly add_bos_token?: boolean;
    readonly add_eos_token?: boolean;
    readonly add_space_prefix?: boolean;
    readonly added_tokens?: readonly string[];
    readonly fim_pre_token_id?: number;
    readonly fim_suf_token_id?: number;
    readonly fim_mid_token_id?: number;
    readonly fim_pad_token_id?: number;
    readonly fim_rep_token_id?: number;
    readonly fim_sep_token_id?: number;
    readonly prefix_token_id?: number;
    readonly suffix_token_id?: number;
    readonly middle_token_id?: number;
};
ggml.model
ts
readonly model: "no_vocab" | "llama" | "gpt2" | "bert" | string;
ggml.pre?
ts
readonly optional pre:
| "default"
| "llama3"
| "llama-v3"
| "llama-bpe"
| "deepseek-llm"
| "deepseek-coder"
| "falcon"
| "falcon3"
| "mpt"
| "starcoder"
| "gpt-2"
| "phi-2"
| "jina-es"
| "jina-de"
| "jina-v1-en"
| "jina-v2-es"
| "jina-v2-de"
| "jina-v2-code"
| "refact"
| "command-r"
| "qwen2"
| "stablelm2"
| "olmo"
| "dbrx"
| "smaug-bpe"
| "poro-chat"
| "chatglm-bpe"
| "viking"
| "jais"
| "tekken"
| "smollm"
| "codeshell"
| "bloom"
| "gpt3-finnish"
| "exaone"
| "chameleon"
| "minerva-7b"
| string;
ggml.tokens
ts
readonly tokens: readonly string[];
ggml.token_type
ts
readonly token_type: GgufMetadataTokenizerTokenType[];
ggml.token_type_count?
ts
readonly optional token_type_count: number;
ggml.scores?
ts
readonly optional scores: readonly number[];
ggml.merges?
ts
readonly optional merges: readonly string[];
ggml.bos_token_id?
ts
readonly optional bos_token_id: number;
ggml.eos_token_id?
ts
readonly optional eos_token_id: number;
ggml.eot_token_id?
ts
readonly optional eot_token_id: number;
ggml.eom_token_id?
ts
readonly optional eom_token_id: number;
ggml.unknown_token_id?
ts
readonly optional unknown_token_id: number;
ggml.separator_token_id?
ts
readonly optional separator_token_id: number;
ggml.padding_token_id?
ts
readonly optional padding_token_id: number;
ggml.cls_token_id?
ts
readonly optional cls_token_id: number;
ggml.mask_token_id?
ts
readonly optional mask_token_id: number;
ggml.add_bos_token?
ts
readonly optional add_bos_token: boolean;
ggml.add_eos_token?
ts
readonly optional add_eos_token: boolean;
ggml.add_space_prefix?
ts
readonly optional add_space_prefix: boolean;
ggml.added_tokens?
ts
readonly optional added_tokens: readonly string[];
ggml.fim_pre_token_id?
ts
readonly optional fim_pre_token_id: number;
ggml.fim_suf_token_id?
ts
readonly optional fim_suf_token_id: number;
ggml.fim_mid_token_id?
ts
readonly optional fim_mid_token_id: number;
ggml.fim_pad_token_id?
ts
readonly optional fim_pad_token_id: number;
ggml.fim_rep_token_id?
ts
readonly optional fim_rep_token_id: number;
ggml.fim_sep_token_id?
ts
readonly optional fim_sep_token_id: number;
ggml.prefix_token_id?
ts
readonly optional prefix_token_id: number;
Deprecated
ggml.suffix_token_id?
ts
readonly optional suffix_token_id: number;
Deprecated
ggml.middle_token_id?
ts
readonly optional middle_token_id: number;
Deprecated
huggingface?
ts
readonly optional huggingface: {
json: string;
};
huggingface.json?
ts
readonly optional json: string;
chat_template?
ts
readonly optional chat_template: string;