2 files changed: +1 -4 lines changed
lines changed Original file line number Diff line number Diff line change @@ -408,14 +408,11 @@ def build_hf_tokenizer(
408408) -> Union [HuggingFaceTokenizer , BaseTokenizer ]:
409409 """
410410 Builds a HuggingFaceTokenizer from the specified path.
411-
412411 This function creates a HuggingFaceTokenizer instance that handles BOS/EOS token
413412 inference and intelligent encoding. The tokenizer automatically detects and loads
414413 from various file formats and infers special token behavior.
415-
416414 Args:
417415 job_config (JobConfig): Job configuration object containing the path to the tokenizer directory.
418-
419416 Returns:
420417 tokenizer (HuggingFaceTokenizer): Loaded tokenizer instance with intelligent BOS/EOS handling
421418 """
Original file line number Diff line number Diff line change @@ -128,7 +128,7 @@ def __init__(self, job_config: JobConfig):
128128
129129 # build dataloader
130130 tokenizer = (
131- self .train_spec .build_tokenizer_fn (job_config . model . tokenizer_path )
131+ self .train_spec .build_tokenizer_fn (job_config )
132132 if self .train_spec .build_tokenizer_fn is not None
133133 else None
134134 )
You can’t perform that action at this time.
0 commit comments