Skip to content
This repository was archived by the owner on Jun 3, 2025. It is now read-only.

Commit 3dd1f8d

Browse files
authored
Export files required by OPT to load the tokenizer (#1571)
* initial commit
* include Tuan's proposal
* Update src/sparseml/transformers/export.py
1 parent 4fb5d27 commit 3dd1f8d

File tree

1 file changed

+8
-3
lines changed

1 file changed

+8
-3
lines changed

src/sparseml/transformers/export.py

Lines changed: 8 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -91,13 +91,18 @@
9191
__all__ = ["export_transformer_to_onnx", "load_task_model"]
9292

9393
MODEL_ONNX_NAME = "model.onnx"
94-
EXTERNAL_ONNX_DATA_NAME = "model.data"
95-
MANDATORY_DEPLOYMENT_FILES: List[str] = [
94+
MANDATORY_DEPLOYMENT_FILES = [
9695
MODEL_ONNX_NAME,
9796
"tokenizer_config.json",
9897
"config.json",
9998
]
100-
OPTIONAL_DEPLOYMENT_FILES: List[str] = [EXTERNAL_ONNX_DATA_NAME, "tokenizer.json"]
99+
EXTERNAL_ONNX_DATA_NAME = ["model.data"]
100+
OPT_TOKENIZER_FILES = ["special_tokens_map.json", "vocab.json", "merges.txt"]
101+
102+
OPTIONAL_DEPLOYMENT_FILES: List[str] = ["tokenizer.json"]
103+
OPTIONAL_DEPLOYMENT_FILES.extend(EXTERNAL_ONNX_DATA_NAME)
104+
OPTIONAL_DEPLOYMENT_FILES.extend(OPT_TOKENIZER_FILES)
105+
101106

102107
_LOGGER = logging.getLogger(__name__)
103108

0 commit comments

Comments
 (0)