Skip to content

Commit 55aef3a

Browse files
H-Huangwwwjn
authored and committed
Fix CI (#1366)
The current deepseek-v3 branch has a broken CI job.
1 parent 72109b9 commit 55aef3a

File tree

2 files changed

+1
-4
lines changed

2 files changed

+1
-4
lines changed

torchtitan/components/tokenizer.py

Lines changed: 0 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -408,14 +408,11 @@ def build_hf_tokenizer(
408408
) -> Union[HuggingFaceTokenizer, BaseTokenizer]:
409409
"""
410410
Builds a HuggingFaceTokenizer from the specified path.
411-
412411
This function creates a HuggingFaceTokenizer instance that handles BOS/EOS token
413412
inference and intelligent encoding. The tokenizer automatically detects and loads
414413
from various file formats and infers special token behavior.
415-
416414
Args:
417415
JobConfig: A JobConfig object containing the path to the tokenizer directory.
418-
419416
Returns:
420417
tokenizer (HuggingFaceTokenizer): Loaded tokenizer instance with intelligent BOS/EOS handling
421418
"""

torchtitan/train.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -128,7 +128,7 @@ def __init__(self, job_config: JobConfig):
128128

129129
# build dataloader
130130
tokenizer = (
131-
self.train_spec.build_tokenizer_fn(job_config.model.tokenizer_path)
131+
self.train_spec.build_tokenizer_fn(job_config)
132132
if self.train_spec.build_tokenizer_fn is not None
133133
else None
134134
)

0 commit comments

Comments
 (0)