Skip to content

Commit d336217

Browse files
committed
Embeddings and Output changes
1 parent f35153a commit d336217

File tree

1 file changed

+3
-3
lines changed

1 file changed

+3
-3
lines changed

src/llama.cpp

+3 -3
Original file line number | Diff line number | Diff line change
@@ -15603,7 +15603,7 @@ static ggml_type llama_tensor_get_type(quantize_state_internal & qs, ggml_type n
1560315603
new_type = GGML_TYPE_Q6_K;
1560415604
}
1560515605
else if (ftype == LLAMA_FTYPE_MOSTLY_Q6_K_ML) {
15606-
new_type = GGML_TYPE_Q8_0;
15606+
new_type = GGML_TYPE_Q6_K;
1560715607
}
1560815608
else if (ftype == LLAMA_FTYPE_MOSTLY_IQ5_XSR || ftype == LLAMA_FTYPE_MOSTLY_IQ5_SR || ftype == LLAMA_FTYPE_MOSTLY_IQ5_MR ||
1560915609
ftype == LLAMA_FTYPE_MOSTLY_IQ5_LR || ftype == LLAMA_FTYPE_MOSTLY_IQ5_BLR) {
@@ -15741,7 +15741,7 @@ static ggml_type llama_tensor_get_type(quantize_state_internal & qs, ggml_type n
1574115741
else if (ftype == LLAMA_FTYPE_MOSTLY_IQ4_SR || ftype == LLAMA_FTYPE_MOSTLY_IQ4_MR || ftype == LLAMA_FTYPE_MOSTLY_IQ4_LR ||
1574215742
ftype == LLAMA_FTYPE_MOSTLY_IQ4_BLR) {
1574315743
if (qs.model.hparams.n_expert >= 8 || qs.model.hparams.n_gqa() >= 12) new_type = GGML_TYPE_Q5_K;
15744-
else new_type = GGML_TYPE_IQ4_XS;
15744+
else new_type = GGML_TYPE_Q8_0;
1574515745
}
1574615746
else if (ftype == LLAMA_FTYPE_MOSTLY_Q4_K_ML) {
1574715747
if (qs.model.hparams.n_expert >= 8 || qs.model.hparams.n_gqa() >= 12) new_type = GGML_TYPE_Q5_K;
@@ -15753,7 +15753,7 @@ static ggml_type llama_tensor_get_type(quantize_state_internal & qs, ggml_type n
1575315753
}
1575415754
else if (ftype == LLAMA_FTYPE_MOSTLY_Q6_K_ML) {
1575515755
if (qs.model.hparams.n_expert >= 8 || qs.model.hparams.n_gqa() >= 12) new_type = GGML_TYPE_Q8_0;
15756-
else new_type = GGML_TYPE_Q6_K;
15756+
else new_type = GGML_TYPE_Q8_0;
1575715757
}
1575815758
else if (ftype == LLAMA_FTYPE_MOSTLY_IQ5_XSR || ftype == LLAMA_FTYPE_MOSTLY_IQ5_SR || ftype == LLAMA_FTYPE_MOSTLY_IQ5_MR ||
1575915759
ftype == LLAMA_FTYPE_MOSTLY_IQ5_LR || ftype == LLAMA_FTYPE_MOSTLY_IQ5_BLR) {

0 commit comments

Comments (0)