diff --git a/utils/convert-hf-to-gguf-bitnet.py b/utils/convert-hf-to-gguf-bitnet.py index f525f58f..59e8456a 100644 --- a/utils/convert-hf-to-gguf-bitnet.py +++ b/utils/convert-hf-to-gguf-bitnet.py @@ -949,7 +949,7 @@ def prepare_tensors(self): raise ValueError(f"Unprocessed experts: {experts}") -@Model.register("BitnetForCausalLM") +@Model.register("BitnetForCausalLM", "BitNetForCausalLM") class BitnetModel(Model): model_arch = gguf.MODEL_ARCH.BITNET diff --git a/utils/generate-dummy-bitnet-model.py b/utils/generate-dummy-bitnet-model.py index be3f6cda..f39e5415 100644 --- a/utils/generate-dummy-bitnet-model.py +++ b/utils/generate-dummy-bitnet-model.py @@ -773,7 +773,7 @@ def preprocess_weights_tl2( return weight -@Model.register("BitnetForCausalLM") +@Model.register("BitnetForCausalLM", "BitNetForCausalLM") class BitnetModel(Model): model_arch = gguf.MODEL_ARCH.BITNET params: str = "" @@ -1045,4 +1045,4 @@ def parse_args() -> argparse.Namespace: if __name__ == '__main__': args = parse_args() - main() \ No newline at end of file + main()