We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 2a86928, commit a4fdb39 (copy full SHA for a4fdb39)
fastdeploy/worker/worker_process.py
@@ -735,7 +735,8 @@ def initialize_fd_config(config_or_args) -> FDConfig:
735
736
# Handle vocabulary size
737
model_config.ori_vocab_size = model_config_dict.get("vocab_size", -1)
738
- if "Ernie4_5_ForCausalLM" in model_config_dict.get("architectures", []):
+ archs = model_config_dict.get("architectures", [])
739
+ if "Ernie4_5_ForCausalLM" in archs or "Ernie4_5_MoeForCausalLM" in archs:
740
model_config.ori_vocab_size = getattr(config_or_args, 'ori_vocab_size', model_config.ori_vocab_size)
741
742
# Handle DeepseekV3 specific config
0 commit comments