Skip to content

Commit 0e41b94

Browse files
committed
improve detection for 70B.
1 parent fb44d72 commit 0e41b94

File tree

1 file changed

+1
-1
lines changed

1 file changed

+1
-1
lines changed

llama.cpp

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1076,7 +1076,7 @@ static void llama_model_load_internal(
 // LLaMAv2
 // TODO: temporary until GGUF
 //patch for llama2 gqa
-if (model.type == e_model::MODEL_65B && hparams.n_mult >= 4096) {
+if (model.type == e_model::MODEL_65B && hparams.n_mult == 4096) {
     fprintf(stderr, "%s: Applying KCPP Patch for 70B model, setting GQA to 8\n", __func__);
     n_gqa = 8;
 }

0 commit comments

Comments
 (0)