Skip to content

Commit 9b63d76

Browse files
committed
Update llama-quant.cpp
Update llama-quant.cpp
1 parent e79b6ff commit 9b63d76

File tree

1 file changed

+3 -3 lines changed

1 file changed

+3 -3 lines changed

src/llama-quant.cpp

+3 -3
Original file line number | Diff line number | Diff line change
@@ -255,7 +255,7 @@ static ggml_type llama_tensor_get_type(quantize_state_impl & qs, ggml_type new_t
255255
&& qs.model.hparams.n_gqa() >= 2)
256256
new_type = GGML_TYPE_Q5_K;
257257
else if ((ftype == LLAMA_FTYPE_MOSTLY_IQ4_NL || ftype == LLAMA_FTYPE_MOSTLY_IQ4_XS) && qs.model.hparams.n_gqa() >= 2) {
258-
new_type = GGML_TYPE_Q5_K;
258+
new_type = GGML_TYPE_Q6_K;
259259
}
260260
// else if ((ftype == LLAMA_FTYPE_MOSTLY_Q4_K_M || ftype == LLAMA_FTYPE_MOSTLY_Q5_K_M) &&
261261
// use_more_bits(qs.i_attention_wv, qs.n_attention_wv)) new_type = GGML_TYPE_Q6_K;
@@ -360,13 +360,13 @@ static ggml_type llama_tensor_get_type(quantize_state_impl & qs, ggml_type new_t
360360
// if (use_more_bits(i_layer, n_layer)) new_type = GGML_TYPE_Q6_K;
361361
// }
362362
// }
363-
else if (ftype == LLAMA_FTYPE_MOSTLY_Q4_K_S && use_more_bits(i_layer, n_layer)) new_type = GGML_TYPE_Q5_K;
363+
// else if (ftype == LLAMA_FTYPE_MOSTLY_Q4_K_S && use_more_bits(i_layer, n_layer)) new_type = GGML_TYPE_Q5_K;
364364
else if (ftype == LLAMA_FTYPE_MOSTLY_Q4_K_M) new_type = GGML_TYPE_Q5_K;
365365
else if (i_layer < n_layer/8 && (ftype == LLAMA_FTYPE_MOSTLY_IQ4_NL || ftype == LLAMA_FTYPE_MOSTLY_IQ4_XS)
366366
&& !qs.has_imatrix && use_more_bits(i_layer, n_layer)) {
367367
new_type = GGML_TYPE_Q5_K;
368368
}
369-
else if (ftype == LLAMA_FTYPE_MOSTLY_Q5_K_S && use_more_bits(i_layer, n_layer)) new_type = GGML_TYPE_Q6_K;
369+
// else if (ftype == LLAMA_FTYPE_MOSTLY_Q5_K_S && use_more_bits(i_layer, n_layer)) new_type = GGML_TYPE_Q6_K;
370370
else if (ftype == LLAMA_FTYPE_MOSTLY_Q5_K_M) new_type = GGML_TYPE_Q6_K;
371371
else if (ftype == LLAMA_FTYPE_MOSTLY_Q4_K_S && arch != LLM_ARCH_FALCON && i_layer < n_layer/8) {
372372
new_type = GGML_TYPE_Q5_K;

0 commit comments

Comments (0)