Skip to content
This repository was archived by the owner on Jul 7, 2023. It is now read-only.

Commit 9d86cf7

Browse files
author
Ryan Sepassi
committed
Add back commented-out enfr datasets
PiperOrigin-RevId: 173612759
1 parent 90aa796 commit 9d86cf7

File tree

1 file changed

+26
-0
lines changed

1 file changed

+26
-0
lines changed

tensor2tensor/data_generators/translate_enfr.py

Lines changed: 26 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -40,13 +40,39 @@
4040
("baseline-1M-enfr/baseline-1M_train.en",
4141
"baseline-1M-enfr/baseline-1M_train.fr")
4242
],
43+
# [
44+
# "http://www.statmt.org/wmt13/training-parallel-commoncrawl.tgz",
45+
# ("commoncrawl.fr-en.en", "commoncrawl.fr-en.fr")
46+
# ],
47+
# [
48+
# "http://www.statmt.org/wmt13/training-parallel-europarl-v7.tgz",
49+
# ("training/europarl-v7.fr-en.en", "training/europarl-v7.fr-en.fr")
50+
# ],
51+
# [
52+
# "http://www.statmt.org/wmt14/training-parallel-nc-v9.tgz",
53+
# ("training/news-commentary-v9.fr-en.en",
54+
# "training/news-commentary-v9.fr-en.fr")
55+
# ],
56+
# [
57+
# "http://www.statmt.org/wmt10/training-giga-fren.tar",
58+
# ("giga-fren.release2.fixed.en.gz",
59+
# "giga-fren.release2.fixed.fr.gz")
60+
# ],
61+
# [
62+
# "http://www.statmt.org/wmt13/training-parallel-un.tgz",
63+
# ("un/undoc.2000.fr-en.en", "un/undoc.2000.fr-en.fr")
64+
# ],
4365
]
4466
_ENFR_TEST_DATASETS = [
4567
[
4668
"https://s3.amazonaws.com/opennmt-trainingdata/baseline-1M-enfr.tgz",
4769
("baseline-1M-enfr/baseline-1M_valid.en",
4870
"baseline-1M-enfr/baseline-1M_valid.fr")
4971
],
72+
# [
73+
# "http://data.statmt.org/wmt17/translation-task/dev.tgz",
74+
# ("dev/newstest2013.en", "dev/newstest2013.fr")
75+
# ],
5076
]
5177

5278

0 commit comments

Comments
 (0)