File tree Expand file tree Collapse file tree
Expand file tree Collapse file tree Original file line number Diff line number Diff line change @@ -587,7 +587,9 @@ eval_dataset_name: 'c4/en:3.0.1'
587587train_split : ' train'
588588eval_split : ' validation'
589589# for HuggingFace input pipeline (dataset_type=hf)
590+ # hf_path, hf_name and hf_data_dir are passed to datasets.load_dataset; check the argument definitions at https://github.com/huggingface/datasets/blob/0feb65dd8733191dd2d1e74215b422fc5939a56a/src/datasets/load.py#L1338-L1408
590591hf_path : ' '
592+ hf_name : ' '
591593hf_data_dir : ' '
592594hf_train_files : ' '
593595hf_eval_split : ' '
Original file line number Diff line number Diff line change @@ -919,7 +919,8 @@ class TfdsDataset(BaseModel):
919919class HfDataset (BaseModel ):
920920 """Configuration specific to HuggingFace datasets."""
921921
922- hf_path : str = Field ("" , description = "Path or name of the Hugging Face dataset." )
922+ hf_path : str = Field ("" , description = "Path of the Hugging Face dataset." )
923+ hf_name : str = Field ("" , description = "Name of the Hugging Face dataset." )
923924 hf_data_dir : PathStr = Field ("" , description = "Data directory for the HF dataset." )
924925 hf_train_files : Optional [str ] = Field (None , description = "Files for the HF training split." )
925926 hf_eval_split : str = Field ("" , description = "Name of the HF evaluation split." )
Original file line number Diff line number Diff line change @@ -352,6 +352,7 @@ def make_hf_train_iterator(
352352 """Load, preprocess dataset and return iterators"""
353353 train_ds = datasets .load_dataset (
354354 config .hf_path ,
355+ name = config .hf_name ,
355356 data_dir = config .hf_data_dir ,
356357 data_files = config .hf_train_files ,
357358 split = config .train_split ,
@@ -404,6 +405,7 @@ def make_hf_eval_iterator(
404405 """Make Hugging Face evaluation iterator. Load and preprocess the eval dataset, and return an iterator."""
405406 eval_ds = datasets .load_dataset (
406407 config .hf_path ,
408+ name = config .hf_name ,
407409 data_dir = config .hf_data_dir ,
408410 data_files = config .hf_eval_files ,
409411 split = config .hf_eval_split ,
You can’t perform that action at this time.
0 commit comments