From 9ac410e54cab3042b153d100702b69440692c234 Mon Sep 17 00:00:00 2001 From: qjtdsqqm94akkyysgjdqo3hx1jn6l17 <18874@student.vgu.edu.vn> Date: Tue, 22 Apr 2025 17:31:02 +0700 Subject: [PATCH 1/2] Register alternative capitalization of BitnetForCausalLM (with a capital N) --- utils/convert-hf-to-gguf-bitnet.py | 2 +- utils/generate-dummy-bitnet-model.py | 4 ++-- 2 files changed, 3 insertions(+), 3 deletions(-) diff --git a/utils/convert-hf-to-gguf-bitnet.py b/utils/convert-hf-to-gguf-bitnet.py index f525f58f..7316d656 100644 --- a/utils/convert-hf-to-gguf-bitnet.py +++ b/utils/convert-hf-to-gguf-bitnet.py @@ -949,7 +949,7 @@ def prepare_tensors(self): raise ValueError(f"Unprocessed experts: {experts}") -@Model.register("BitnetForCausalLM") +@Model.register("BitnetForCausalLM", "BitNetForCausalLM" class BitnetModel(Model): model_arch = gguf.MODEL_ARCH.BITNET diff --git a/utils/generate-dummy-bitnet-model.py b/utils/generate-dummy-bitnet-model.py index be3f6cda..053d7a71 100644 --- a/utils/generate-dummy-bitnet-model.py +++ b/utils/generate-dummy-bitnet-model.py @@ -773,7 +773,7 @@ def preprocess_weights_tl2( return weight -@Model.register("BitnetForCausalLM") +@Model.register("BitnetForCausalLM", "BitNetForCausalLM" class BitnetModel(Model): model_arch = gguf.MODEL_ARCH.BITNET params: str = "" @@ -1045,4 +1045,4 @@ def parse_args() -> argparse.Namespace: if __name__ == '__main__': args = parse_args() - main() \ No newline at end of file + main() From 9e0f32a56f7a6bd6ad2e5cdeed2e0b70ca4e100f Mon Sep 17 00:00:00 2001 From: qjtdsqqm94akkyysgjdqo3hx1jn6l17 <18874@student.vgu.edu.vn> Date: Tue, 22 Apr 2025 17:37:02 +0700 Subject: [PATCH 2/2] Fix missing closing parenthesis in Model.register decorators --- utils/convert-hf-to-gguf-bitnet.py | 2 +- utils/generate-dummy-bitnet-model.py | 2 +- 2 files changed, 2 insertions(+), 2 deletions(-) diff --git a/utils/convert-hf-to-gguf-bitnet.py b/utils/convert-hf-to-gguf-bitnet.py index 7316d656..59e8456a 100644 --- a/utils/convert-hf-to-gguf-bitnet.py +++ 
b/utils/convert-hf-to-gguf-bitnet.py @@ -949,7 +949,7 @@ def prepare_tensors(self): raise ValueError(f"Unprocessed experts: {experts}") -@Model.register("BitnetForCausalLM", "BitNetForCausalLM" +@Model.register("BitnetForCausalLM", "BitNetForCausalLM") class BitnetModel(Model): model_arch = gguf.MODEL_ARCH.BITNET diff --git a/utils/generate-dummy-bitnet-model.py b/utils/generate-dummy-bitnet-model.py index 053d7a71..f39e5415 100644 --- a/utils/generate-dummy-bitnet-model.py +++ b/utils/generate-dummy-bitnet-model.py @@ -773,7 +773,7 @@ def preprocess_weights_tl2( return weight -@Model.register("BitnetForCausalLM", "BitNetForCausalLM" +@Model.register("BitnetForCausalLM", "BitNetForCausalLM") class BitnetModel(Model): model_arch = gguf.MODEL_ARCH.BITNET params: str = ""