diff options
author | MoonFighter <MoonFighter@users.noreply.github.com> | 2021-09-16 12:47:19 +0300 |
---|---|---|
committer | GitHub <noreply@github.com> | 2021-09-16 12:47:19 +0300 |
commit | 8d6a6977ec6b05c5a4a6c710732c283a0f845673 (patch) | |
tree | c0b5fde928114018e0898aa8755455e9dc7d7b02 | |
parent | 9f5abd1cea8915f4d6cc74d8a68791acd6f5acc1 (diff) |
fix a bug which results in wrong indices in reader (#2100)
-rw-r--r-- | onmt/inputters/text_dataset.py | 6 |
1 file changed, 3 insertions, 3 deletions
```diff
diff --git a/onmt/inputters/text_dataset.py b/onmt/inputters/text_dataset.py
index a55d2593..98e8f1f7 100644
--- a/onmt/inputters/text_dataset.py
+++ b/onmt/inputters/text_dataset.py
@@ -36,16 +36,16 @@ class TextDataReader(DataReaderBase):
             if isinstance(v, str):
                 features_values.append(DataReaderBase._read_file(features))
             else:
-                features_values.append(v)
+                features_values.append(v)
         for i, (seq, *feats) in enumerate(zip(sequences, *features_values)):
             ex_dict = {}
             if isinstance(seq, bytes):
                 seq = seq.decode("utf-8")
             ex_dict[side] = seq
-            for i, f in enumerate(feats):
+            for j, f in enumerate(feats):
                 if isinstance(f, bytes):
                     f = f.decode("utf-8")
-                ex_dict[features_names[i]] = f
+                ex_dict[features_names[j]] = f
             yield {side: ex_dict, "indices": i}
```