|
40 | 40 | ("baseline-1M-enfr/baseline-1M_train.en",
|
41 | 41 | "baseline-1M-enfr/baseline-1M_train.fr")
|
42 | 42 | ],
|
| 43 | + # [ |
| 44 | + # "http://www.statmt.org/wmt13/training-parallel-commoncrawl.tgz", |
| 45 | + # ("commoncrawl.fr-en.en", "commoncrawl.fr-en.fr") |
| 46 | + # ], |
| 47 | + # [ |
| 48 | + # "http://www.statmt.org/wmt13/training-parallel-europarl-v7.tgz", |
| 49 | + # ("training/europarl-v7.fr-en.en", "training/europarl-v7.fr-en.fr") |
| 50 | + # ], |
| 51 | + # [ |
| 52 | + # "http://www.statmt.org/wmt14/training-parallel-nc-v9.tgz", |
| 53 | + # ("training/news-commentary-v9.fr-en.en", |
| 54 | + # "training/news-commentary-v9.fr-en.fr") |
| 55 | + # ], |
| 56 | + # [ |
| 57 | + # "http://www.statmt.org/wmt10/training-giga-fren.tar", |
| 58 | + # ("giga-fren.release2.fixed.en.gz", |
| 59 | + # "giga-fren.release2.fixed.fr.gz") |
| 60 | + # ], |
| 61 | + # [ |
| 62 | + # "http://www.statmt.org/wmt13/training-parallel-un.tgz", |
| 63 | + # ("un/undoc.2000.fr-en.en", "un/undoc.2000.fr-en.fr") |
| 64 | + # ], |
43 | 65 | ]
|
44 | 66 | _ENFR_TEST_DATASETS = [
|
45 | 67 | [
|
46 | 68 | "https://s3.amazonaws.com/opennmt-trainingdata/baseline-1M-enfr.tgz",
|
47 | 69 | ("baseline-1M-enfr/baseline-1M_valid.en",
|
48 | 70 | "baseline-1M-enfr/baseline-1M_valid.fr")
|
49 | 71 | ],
|
| 72 | + # [ |
| 73 | + # "http://data.statmt.org/wmt17/translation-task/dev.tgz", |
| 74 | + # ("dev/newstest2013.en", "dev/newstest2013.fr") |
| 75 | + # ], |
50 | 76 | ]
|
51 | 77 |
|
52 | 78 |
|
|
0 commit comments