Skip to content

Commit

Permalink
Add WMT24 test sets
Browse files (browse the repository at this point in the history)
  • Loading branch information
mjpost committed Jan 2, 2025
1 parent 0f35101 commit 245af68
Showing 1 changed file with 19 additions and 0 deletions.
19 changes: 19 additions & 0 deletions sacrebleu/dataset/__init__.py
Original file line number | Diff line number | Diff line change
Expand Up @@ -74,6 +74,25 @@

DATASETS = {
# wmt
"wmt24": WMTXMLDataset(
"wmt24",
data=["https://github.com/wmt-conference/wmt24-news-systems/releases/download/v1.1/data_nots.tar.gz"],
description="WMT24 official test set release, v1.1 (excluding TS)",
md5=["35ea35f398190de3a17bcb9a08333b1b"],
langpairs={
"cs-uk": ["xml/wmttest2024.cs-uk.all.xml"],
"en-cs": ["xml/wmttest2024.en-cs.all.xml"],
"en-de": ["xml/wmttest2024.en-de.all.xml"],
"en-es": ["xml/wmttest2024.en-es.all.xml"],
"en-hi": ["xml/wmttest2024.en-hi.all.xml"],
"en-is": ["xml/wmttest2024.en-is.all.xml"],
"en-ja": ["xml/wmttest2024.en-ja.all.xml"],
"en-ru": ["xml/wmttest2024.en-ru.all.xml"],
"en-uk": ["xml/wmttest2024.en-uk.all.xml"],
"en-zh": ["xml/wmttest2024.en-zh.all.xml"],
"ja-zh": ["xml/wmttest2024.ja-zh.all.xml"],
},
),
"wmt23": WMTXMLDataset(
"wmt23",
data=["https://github.com/wmt-conference/wmt23-news-systems/archive/refs/tags/v.0.1.tar.gz"],
Expand Down

0 comments on commit 245af68

Please sign in to comment.