Skip to content

Commit 901c27f

Browse files
committed
Update llama-quant.cpp
1 parent 4818abb commit 901c27f

File tree

1 file changed

+4
-0
lines changed

1 file changed

+4
-0
lines changed

src/llama-quant.cpp

Lines changed: 4 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -338,6 +338,8 @@ static ggml_type llama_tensor_get_type(quantize_state_impl & qs, ggml_type new_t
338 338
// new_type = GGML_TYPE_IQ2_S;
339 339
new_type = GGML_TYPE_Q4_K;
340 340
}
341+
else
342+
new_type = GGML_TYPE_Q4_K;
341 343
} else if (name.find("attn_q.weight") != std::string::npos) {
342 344
if (ftype == LLAMA_FTYPE_MOSTLY_IQ3_XS) {
343 345
// new_type = GGML_TYPE_IQ3_XXS;
@@ -347,6 +349,8 @@ static ggml_type llama_tensor_get_type(quantize_state_impl & qs, ggml_type new_t
347 349
// new_type = GGML_TYPE_IQ2_S;
348 350
new_type = GGML_TYPE_Q4_K;
349 351
}
352+
else
353+
new_type = GGML_TYPE_Q4_K;
350 354
} else if (name.find("ffn_down.weight") != std::string::npos) {
351 355
// First 3 Layers
352 356
new_type = GGML_TYPE_Q6_K;

0 commit comments

Comments
 (0)