You signed in with another tab or window. Reload to refresh your session.You signed out in another tab or window. Reload to refresh your session.You switched accounts on another tab or window. Reload to refresh your session.Dismiss alert
# Each data-loading host will load per_device_batch_size * expansion_factor_real_data.
531
531
# When set to a value between 0 and 1, it allows the Grain pipeline to use a smaller chip count to read a checkpoint from a job with a larger chip count.
532
532
# Details in https://github.com/AI-Hypercomputer/maxtext/blob/main/docs/guides/data_input_grain.md#using-grain
533
-
expansion_factor_real_data: -1.0
533
+
expansion_factor_real_data: -1.0
534
534
eval_per_device_batch_size: 0.0
535
535
max_corpus_chars: 10_000_000
536
536
train_data_columns: ['text'] # for DPO dataset containing "chosen" and "rejected"
@@ -595,14 +595,15 @@ grain_train_files: ''
595
595
grain_eval_files: ''
596
596
grain_train_mixture_config_path: '' # Path to a JSON file specifying the mixture weights for Grain training data.
597
597
grain_file_type: 'arrayrecord' # arrayrecord or parquet
598
-
grain_worker_count: 1
598
+
grain_worker_count: 1 # Set to -1 to enable auto-tuning, which automatically determines the optimal worker count. See https://google-grain.readthedocs.io/en/latest/_autosummary/grain.experimental.pick_performance_config.html
599
599
grain_per_worker_buffer_size: 1
600
600
# num_threads and prefetch_buffer_size are per-worker per-dataset. Used in ReadOptions (https://google-grain.readthedocs.io/en/latest/tutorials/data_loader_tutorial.html#per-worker-readoptions)
601
601
# The default value matches that in the Grain package. If mixing multiple data sources, consider lowering these values to reduce memory usage.
602
-
grain_num_threads: 16
602
+
grain_num_threads: 16
603
603
grain_prefetch_buffer_size: 500
604
604
grain_worker_count_eval: 1
605
605
grain_per_worker_buffer_size_eval: 1
606
+
grain_ram_budget_mb: 1024 # RAM budget (MB) for auto-tuning worker count. Only used when grain_worker_count is -1.
606
607
grain_num_threads_eval: 16
607
608
grain_prefetch_buffer_size_eval: 500
608
609
grain_data_source_max_workers: 16 # Max workers for ThreadPoolExecutor when mixing multiple Grain data sources.
0 commit comments