Skip to content

Commit

Permalink
add missing is_train kwarg in tokenize_id
Browse files Browse the repository at this point in the history
  • Loading branch information
francoishernandez committed Jan 15, 2025
1 parent 7947a6b commit 928c6fe
Showing 1 changed file with 2 additions and 2 deletions.
4 changes: 2 additions & 2 deletions eole/transforms/tokenize_id.py
Original file line number Diff line number Diff line change
Expand Up @@ -96,10 +96,10 @@ def tokenize_string(self, string, side="src", is_train=False):
         return tokens

     def apply(self, example, is_train=False, stats=None, **kwargs):
-        src_tokens = self.tokenize_string(" ".join(example["src"]), side="src")
+        src_tokens = self.tokenize_string(" ".join(example["src"]), side="src", is_train=is_train)
         example["src_ids"] = src_tokens
         if example.get("tgt", None) is not None:
-            tgt_tokens = self.tokenize_string(" ".join(example["tgt"]), side="tgt")
+            tgt_tokens = self.tokenize_string(" ".join(example["tgt"]), side="tgt", is_train=is_train)
             example["tgt_ids"] = tgt_tokens
         return example

Expand Down

0 comments on commit 928c6fe

Please sign in to comment.