@@ -55,7 +55,10 @@ def resolve_transformers_arch(model_config: ModelConfig,
55
55
# "AutoModelFor<Task>": "<your-repo-name>--<config-name>",
56
56
# },
57
57
auto_modules = {
58
- name : get_class_from_dynamic_module (module , model_config .model )
58
+ name :
59
+ get_class_from_dynamic_module (module ,
60
+ model_config .model ,
61
+ revision = model_config .revision )
59
62
for name , module in sorted (auto_map .items (), key = lambda x : x [0 ])
60
63
}
61
64
custom_model_module = auto_modules .get ("AutoModel" )
@@ -97,10 +100,10 @@ def get_model_architecture(
97
100
architectures = ["QuantMixtralForCausalLM" ]
98
101
99
102
vllm_supported_archs = ModelRegistry .get_supported_archs ()
100
- is_vllm_supported = any (arch in vllm_supported_archs
101
- for arch in architectures )
102
- if (not is_vllm_supported
103
- or model_config .model_impl == ModelImpl .TRANSFORMERS ):
103
+ vllm_not_supported = not any (arch in vllm_supported_archs
104
+ for arch in architectures )
105
+ if (model_config . model_impl == ModelImpl . TRANSFORMERS or
106
+ model_config .model_impl != ModelImpl .VLLM and vllm_not_supported ):
104
107
architectures = resolve_transformers_arch (model_config , architectures )
105
108
106
109
model_cls , arch = ModelRegistry .resolve_model_cls (architectures )
0 commit comments