This repository was archived by the owner on Jul 7, 2023. It is now read-only.
2 files changed, with 3 additions (+3) and 3 deletions (-3).
lines changed Original file line number Diff line number Diff line change @@ -356,7 +356,7 @@ def generate_data_for_problem(problem):
356356
357357def generate_data_for_registered_problem (problem_name ):
358358 problem = registry .problem (problem_name )
359- problem .generate_data (FLAGS .data_dir , FLAGS .tmp_dir )
359+ problem .generate_data (FLAGS .data_dir , FLAGS .tmp_dir , FLAGS . num_shards )
360360
361361
362362if __name__ == "__main__" :
Columns: original file line number | diff line number | diff line change (the two line numbers appear fused at the start of each row below). Hunk: @@ -49,10 +49,10 @@ def target_vocab_size(self):
4949 def feature_encoders (self , data_dir ):
5050 return _default_wmt_feature_encoders (data_dir , self .target_vocab_size )
5151
52- def generate_data (self , data_dir , tmp_dir ):
52+ def generate_data (self , data_dir , tmp_dir , num_shards = 100 ):
5353 generator_utils .generate_dataset_and_shuffle (
5454 ende_wordpiece_token_generator (tmp_dir , True , self .target_vocab_size ),
55- self .training_filepaths (data_dir , 100 , shuffled = False ),
55+ self .training_filepaths (data_dir , num_shards , shuffled = False ),
5656 ende_wordpiece_token_generator (tmp_dir , False , self .target_vocab_size ),
5757 self .dev_filepaths (data_dir , 1 , shuffled = False ))
5858
You can’t perform that action at this time.
0 commit comments