Type Alias: GgufMetadataDefaultArchitectureType
ts
type GgufMetadataDefaultArchitectureType: {
vocab_size: number;
context_length: number;
embedding_length: number;
block_count: number;
feed_forward_length: number;
use_parallel_residual: boolean;
tensor_data_layout: string;
expert_count: number;
expert_used_count: number;
pooling_type: GgufMetadataArchitecturePoolingType;
logit_scale: number;
attention: {
head_count: number;
head_count_kv: number;
max_alibi_bias: number;
clamp_kqv: number;
layer_norm_epsilon: number;
layer_norm_rms_epsilon: number;
key_length: number;
value_length: number;
causal: boolean;
};
rope: {
dimension_count: number;
freq_base: number;
scale_linear: number;
scaling: {
type: "none" | "linear" | "yarn" | string;
factor: number;
original_context_length: number;
finetuned: boolean;
};
};
ssm: {
conv_kernel: number;
inner_size: number;
state_size: number;
time_step_rank: number;
};
};
Type declaration
vocab_size?
ts
readonly optional vocab_size: number;
context_length?
ts
readonly optional context_length: number;
embedding_length?
ts
readonly optional embedding_length: number;
block_count?
ts
readonly optional block_count: number;
feed_forward_length?
ts
readonly optional feed_forward_length: number;
use_parallel_residual?
ts
readonly optional use_parallel_residual: boolean;
tensor_data_layout?
ts
readonly optional tensor_data_layout: string;
expert_count?
ts
readonly optional expert_count: number;
expert_used_count?
ts
readonly optional expert_used_count: number;
pooling_type?
ts
readonly optional pooling_type: GgufMetadataArchitecturePoolingType;
logit_scale?
ts
readonly optional logit_scale: number;
attention?
ts
readonly optional attention: {
head_count: number;
head_count_kv: number;
max_alibi_bias: number;
clamp_kqv: number;
layer_norm_epsilon: number;
layer_norm_rms_epsilon: number;
key_length: number;
value_length: number;
causal: boolean;
};
attention.head_count?
ts
readonly optional head_count: number;
attention.head_count_kv?
ts
readonly optional head_count_kv: number;
attention.max_alibi_bias?
ts
readonly optional max_alibi_bias: number;
attention.clamp_kqv?
ts
readonly optional clamp_kqv: number;
attention.layer_norm_epsilon?
ts
readonly optional layer_norm_epsilon: number;
attention.layer_norm_rms_epsilon?
ts
readonly optional layer_norm_rms_epsilon: number;
attention.key_length?
ts
readonly optional key_length: number;
attention.value_length?
ts
readonly optional value_length: number;
attention.causal?
ts
readonly optional causal: boolean;
rope?
ts
readonly optional rope: {
dimension_count: number;
freq_base: number;
scale_linear: number;
scaling: {
type: "none" | "linear" | "yarn" | string;
factor: number;
original_context_length: number;
finetuned: boolean;
};
};
rope.dimension_count?
ts
readonly optional dimension_count: number;
rope.freq_base?
ts
readonly optional freq_base: number;
rope.scale_linear?
ts
readonly optional scale_linear: number;
rope.scaling?
ts
readonly optional scaling: {
type: "none" | "linear" | "yarn" | string;
factor: number;
original_context_length: number;
finetuned: boolean;
};
rope.scaling.type?
ts
readonly optional type: "none" | "linear" | "yarn" | string;
rope.scaling.factor?
ts
readonly optional factor: number;
rope.scaling.original_context_length?
ts
readonly optional original_context_length: number;
rope.scaling.finetuned?
ts
readonly optional finetuned: boolean;
ssm?
ts
readonly optional ssm: {
conv_kernel: number;
inner_size: number;
state_size: number;
time_step_rank: number;
};
ssm.conv_kernel?
ts
readonly optional conv_kernel: number;
ssm.inner_size?
ts
readonly optional inner_size: number;
ssm.state_size?
ts
readonly optional state_size: number;
ssm.time_step_rank?
ts
readonly optional time_step_rank: number;