You signed in with another tab or window. Reload to refresh your session. You signed out in another tab or window. Reload to refresh your session. You switched accounts on another tab or window. Reload to refresh your session. Dismiss alert
Copy file name to clipboardExpand all lines: src/MaxText/configs/base.yml
+2-2Lines changed: 2 additions & 2 deletions
Original file line number
Diff line number
Diff line change
@@ -604,10 +604,10 @@ grain_train_files: ''
604
604
grain_eval_files: ''
605
605
grain_train_mixture_config_path: ''  # Path to a JSON file specifying the mixture weights for Grain training data.
606
606
grain_file_type: 'arrayrecord'  # arrayrecord or parquet
607
-
grain_packing_type: 'first_fit'  # 'first_fit' or 'concat_then_split'. See details of the corresponding module in https://google-grain.readthedocs.io/en/latest/grain.experimental.html
607
+
grain_packing_type: 'first_fit'  # 'first_fit', 'best_fit' or 'concat_then_split'. See details of the corresponding module in https://google-grain.readthedocs.io/en/latest/grain.experimental.html
608
608
grain_worker_count: 1  # Set to -1 to enable auto-tuning: automatically determines optimal worker count. See https://google-grain.readthedocs.io/en/latest/_autosummary/grain.experimental.pick_performance_config.html
609
609
grain_per_worker_buffer_size: 1
610
-
# num_threads and prefetch_buffer_size are per-worker per-dataset.
610
+
# num_threads and prefetch_buffer_size are per-worker per-dataset.
611
611
# When using array_records, they are used in ReadOptions (https://google-grain.readthedocs.io/en/latest/tutorials/data_loader_tutorial.html#per-worker-readoptions)
612
612
# The default value matches that in the Grain package. If mixing multiple data sources, consider lowering these values to reduce memory usage.
613
613
# When using parquet, grain_num_threads is the number of files to read and interleave in parallel
0 commit comments