Skip to content

Commit

Permalink
add dataset_root (#11837)
Browse files: browse the repository at this point in the history.
  • Loading branch information
suiyoubi authored Jan 17, 2025
1 parent ca4e4f0 commit ad807ae
Showing 1 changed file with 2 additions and 1 deletion.
3 changes: 2 additions & 1 deletion nemo/collections/llm/bert/data/specter.py
Original file line number | Diff line number | Diff line change
Expand Up @@ -43,6 +43,7 @@ class SpecterDataModule(FineTuningDataModule, IOMixin):

def __init__(
self,
dataset_root: str = None,
seq_length: int = 512,
tokenizer: Optional["TokenizerSpec"] = None,
micro_batch_size: int = 4,
Expand All @@ -61,7 +62,7 @@ def __init__(
self.delete_raw = delete_raw

super().__init__(
dataset_root=get_dataset_root("specter"),
dataset_root=get_dataset_root("specter") if dataset_root is None else dataset_root,
seq_length=seq_length,
tokenizer=tokenizer,
micro_batch_size=micro_batch_size,
Expand Down

0 comments on commit ad807ae

Please sign in to comment.