File tree Expand file tree Collapse file tree 2 files changed +3
-0
lines changed Expand file tree Collapse file tree 2 files changed +3
-0
lines changed Original file line number Diff line number Diff line change @@ -2069,6 +2069,8 @@ def set_gguf_parameters(self):
2069
2069
self .gguf_writer .add_convnext_embedding_length (self .hparams ["convnext" ]["n_embd" ])
2070
2070
self .gguf_writer .add_convnext_block_count (self .hparams ["convnext" ]["n_layer" ])
2071
2071
2072
+ self .gguf_writer .add_causal_attention (False )
2073
+
2072
2074
2073
2075
@Model .register ("Qwen2MoeForCausalLM" )
2074
2076
class Qwen2MoeModel (Model ):
Original file line number Diff line number Diff line change @@ -6393,6 +6393,7 @@ static void llm_load_hparams(
6393
6393
ml.get_key(LLM_KV_ATTENTION_LAYERNORM_EPS, hparams.f_norm_eps);
6394
6394
ml.get_key(LLM_KV_ATTENTION_GROUPNORM_EPS, hparams.f_norm_group_eps);
6395
6395
ml.get_key(LLM_KV_ATTENTION_GROUPNORM_GROUPS, hparams.n_norm_groups);
6396
+ ml.get_key(LLM_KV_ATTENTION_CAUSAL, hparams.causal_attn);
6396
6397
} break;
6397
6398
default: (void)0;
6398
6399
}
You can’t perform that action at this time.
0 commit comments