Skip to content
This repository was archived by the owner on Jul 7, 2023. It is now read-only.

Commit 31f5dfa

Browse files
committed
Clear comment, add sanity check, change algorithmic_reverse_nlplike max_length and add __pycache__ entry in .gitignore
1 parent 759789b commit 31f5dfa

File tree

3 files changed

+16
-9
lines changed

3 files changed

+16
-9
lines changed

.gitignore

Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -1,5 +1,7 @@
11
# Compiled python modules.
22
*.pyc
3+
# Byte-compiled
4+
__pycache__/
35

46
# Python egg metadata, regenerated from source files by setuptools.
57
/*.egg-info

tensor2tensor/bin/t2t-datagen

Lines changed: 8 additions & 8 deletions
Original file line numberDiff line numberDiff line change
@@ -87,15 +87,15 @@ _SUPPORTED_PROBLEM_GENERATORS = {
8787
lambda: algorithmic.multiplication_generator(10, 40, 100000),
8888
lambda: algorithmic.multiplication_generator(10, 400, 10000)),
8989
"algorithmic_reverse_nlplike_decimal8K": (
90-
lambda: algorithmic.reverse_generator_nlplike(8000, 40, 100000,
91-
10, 1.250),
92-
lambda: algorithmic.reverse_generator_nlplike(8000, 400, 10000,
93-
10, 1.250)),
90+
lambda: algorithmic.reverse_generator_nlplike(8000, 70, 100000,
91+
10, 1.300),
92+
lambda: algorithmic.reverse_generator_nlplike(8000, 700, 10000,
93+
10, 1.300)),
9494
"algorithmic_reverse_nlplike_decimal32K": (
95-
lambda: algorithmic.reverse_generator_nlplike(32000, 40, 100000,
96-
10, 1.005),
97-
lambda: algorithmic.reverse_generator_nlplike(32000, 400, 10000,
98-
10, 1.005)),
95+
lambda: algorithmic.reverse_generator_nlplike(32000, 70, 100000,
96+
10, 1.050),
97+
lambda: algorithmic.reverse_generator_nlplike(32000, 700, 10000,
98+
10, 1.050)),
9999
"algorithmic_algebra_inverse": (
100100
lambda: algorithmic_math.algebra_inverse(26, 0, 2, 100000),
101101
lambda: algorithmic_math.algebra_inverse(26, 3, 3, 10000)),

tensor2tensor/data_generators/algorithmic.py

Lines changed: 6 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -123,7 +123,12 @@ def zipf_random_sample(distr_map, sample_len):
123123
124124
"""
125125
u = np.random.random(sample_len)
126-
return [t+1 for t in np.searchsorted(distr_map, u)] # 0 pad and 1 EOS
126+
# np.random.random produces values in the range [0.0, 1.0); drawing an
127+
# exact 0.0 is highly improbable but possible, so the t > 0 check below
128+
# is a sanity check that guards against that case. Otherwise,
129+
# t+1 is enough to keep us from generating PAD (0) and EOS (1), which are
130+
# reserved symbols.
131+
return [t+1 if t > 0 else t+2 for t in np.searchsorted(distr_map, u)]
127132

128133

129134
def reverse_generator_nlplike(nbr_symbols, max_length, nbr_cases, \

0 commit comments

Comments
 (0)