Skip to content
This repository was archived by the owner on Jul 7, 2023. It is now read-only.

Commit b3de49a

Browse files
Larger source vocab; adapt to new upstream version
1 parent accf019 commit b3de49a

File tree

1 file changed

+4
-4
lines changed

1 file changed

+4
-4
lines changed

tensor2tensor/ice_parsing/ice_parsing.py

Lines changed: 4 additions & 4 deletions
Original file line number | Diff line number | Diff line change
@@ -66,7 +66,7 @@ class IceParsingTokens(problem.Problem):
6666

6767
@property
6868
def source_vocab_size(self):
69-
return 2**13 # 8192
69+
return 2**14 # 16384
7070

7171
@property
7272
def target_vocab_size(self):
@@ -84,18 +84,18 @@ def feature_encoders(self, data_dir):
8484
"targets": target_subtokenizer,
8585
}
8686

87-
def generate_data(self, data_dir, tmp_dir, num_shards=100):
87+
def generate_data(self, data_dir, tmp_dir, task_id=-1):
8888
generator_utils.generate_dataset_and_shuffle(
8989
tabbed_parsing_token_generator(data_dir, tmp_dir, True, "ice",
9090
self.source_vocab_size,
9191
self.target_vocab_size),
92-
self.training_filepaths(data_dir, num_shards, shuffled=False),
92+
self.training_filepaths(data_dir, 1, shuffled=False),
9393
tabbed_parsing_token_generator(data_dir, tmp_dir, False, "ice",
9494
self.source_vocab_size,
9595
self.target_vocab_size),
9696
self.dev_filepaths(data_dir, 1, shuffled=False))
9797

98-
def hparams(self, defaults, unused_model_hparams):
98+
def hparams(self, defaults, model_hparams):
9999
p = defaults
100100
source_vocab_size = self._encoders["inputs"].vocab_size
101101
p.input_modality = {"inputs": (registry.Modalities.SYMBOL, source_vocab_size)}

0 commit comments

Comments (0)