This commit is contained in:
Georgi Gerganov 2024-12-24 09:42:53 +02:00
parent bb0b2c4f56
commit 1e7e3384e1
No known key found for this signature in database
GPG Key ID: 449E073F9DC10735

View File

@ -1531,9 +1531,11 @@ static void llm_load_hparams(
switch (hparams.n_embd) { switch (hparams.n_embd) {
case 384: model.type = e_model::MODEL_33M; break; // MiniLM-L12, bge-small case 384: model.type = e_model::MODEL_33M; break; // MiniLM-L12, bge-small
case 768: model.type = e_model::MODEL_109M; break; // bge-base case 768: model.type = e_model::MODEL_109M; break; // bge-base
default: model.type = e_model::MODEL_UNKNOWN;
} break; } break;
case 24: case 24:
model.type = e_model::MODEL_335M; break; // bge-large model.type = e_model::MODEL_335M; break; // bge-large
default: model.type = e_model::MODEL_UNKNOWN;
} }
} break; } break;
case LLM_ARCH_JINA_BERT_V2: case LLM_ARCH_JINA_BERT_V2:
@ -1547,6 +1549,7 @@ static void llm_load_hparams(
switch (hparams.n_layer) { switch (hparams.n_layer) {
case 4: model.type = e_model::MODEL_33M; break; // jina-embeddings-small case 4: model.type = e_model::MODEL_33M; break; // jina-embeddings-small
case 12: model.type = e_model::MODEL_137M; break; // jina-embeddings-base case 12: model.type = e_model::MODEL_137M; break; // jina-embeddings-base
default: model.type = e_model::MODEL_UNKNOWN;
} }
} break; } break;
case LLM_ARCH_NOMIC_BERT: case LLM_ARCH_NOMIC_BERT:
@ -1570,7 +1573,9 @@ static void llm_load_hparams(
switch (hparams.n_embd) { switch (hparams.n_embd) {
case 2560: model.type = e_model::MODEL_3B; break; case 2560: model.type = e_model::MODEL_3B; break;
case 4096: model.type = e_model::MODEL_7B; break; case 4096: model.type = e_model::MODEL_7B; break;
default: model.type = e_model::MODEL_UNKNOWN;
} break; } break;
default: model.type = e_model::MODEL_UNKNOWN;
} }
// TODO: become GGUF KV parameter // TODO: become GGUF KV parameter
@ -2099,7 +2104,7 @@ static void llm_load_hparams(
ml.get_key(LLM_KV_ATTENTION_GROUPNORM_GROUPS, hparams.n_norm_groups); ml.get_key(LLM_KV_ATTENTION_GROUPNORM_GROUPS, hparams.n_norm_groups);
ml.get_key(LLM_KV_ATTENTION_CAUSAL, hparams.causal_attn); ml.get_key(LLM_KV_ATTENTION_CAUSAL, hparams.causal_attn);
} break; } break;
default: (void)0; default: throw std::runtime_error("unsupported model architecture");
} }
model.ftype = ml.ftype; model.ftype = ml.ftype;