We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 4e38809 commit 25c6e82 (Copy full SHA for 25c6e82)
llama.cpp
@@ -3860,7 +3860,7 @@ static void llm_load_hparams(
3860
switch (hparams.n_layer) {
3861
case 22: model.type = e_model::MODEL_1B; break;
3862
case 26: model.type = e_model::MODEL_3B; break;
3863
- case 32: model.type = hparams.n_head == hparams.n_head_kv ? e_model::MODEL_7B : e_model::MODEL_8B; break; // LLaMa 8B v3 uses GQA
+ case 32: model.type = hparams.n_vocab < 40000 ? e_model::MODEL_7B : e_model::MODEL_8B; break;
3864
case 40: model.type = e_model::MODEL_13B; break;
3865
case 48: model.type = e_model::MODEL_34B; break;
3866
case 60: model.type = e_model::MODEL_30B; break;
0 commit comments