Skip to content

Commit 6a3ff16

Browse files
Merge pull request #735 from mlcommons/dev
Dev -> main
2 parents 8bd3876 + e494956 commit 6a3ff16

File tree

8 files changed

+48
-30
lines changed

8 files changed

+48
-30
lines changed

CHANGELOG.md

Lines changed: 18 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -1,5 +1,23 @@
11
# Change Log
22

3+
## algoperf-benchmark-0.1.4 (2024-03-26)
4+
5+
Upgrade CUDA version to CUDA 12.1:
6+
- Upgrade CUDA version in Dockerfiles that will be used for scoring.
7+
- Update Jax and PyTorch package version tags to use local CUDA installation.
8+
9+
Add flag for completely disabling checkpointing.
10+
- Note that we will run with checkpointing off at scoring time.
11+
12+
Update Deepspeech and Conformer variant target setting configurations.
13+
- Note that variant targets are not final.
14+
15+
Fixed a bug in the scoring code so that it takes the best trial in a study for the external-tuning ruleset.
16+
17+
Added instructions for submission.
18+
19+
Changed default number of workers for PyTorch data loaders to 0. Running with >0 workers may lead to incorrect eval results; see https://github.com/mlcommons/algorithmic-efficiency/issues/732.
20+
321
## algoperf-benchmark-0.1.2 (2024-03-04)
422
Workload variant additions and fixes:
523
- Add Deepspeech workload variant
Lines changed: 5 additions & 5 deletions
Original file line numberDiff line numberDiff line change
@@ -1,27 +1,27 @@
11
{
22
"learning_rate": {
33
"feasible_points": [
4-
0.001308209823469072
4+
0.0007852999990476642
55
]
66
},
77
"beta1": {
88
"feasible_points": [
9-
0.9731333693827139
9+
0.6994142393023162
1010
]
1111
},
1212
"beta2": {
1313
"feasible_points": [
14-
0.9981232922116359
14+
0.9918636824608852
1515
]
1616
},
1717
"warmup_steps": {
1818
"feasible_points": [
19-
9999
19+
6000
2020
]
2121
},
2222
"weight_decay": {
2323
"feasible_points": [
24-
0.16375311233774334
24+
0.07286322158086678
2525
]
2626
}
2727
}
Lines changed: 4 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -1,17 +1,17 @@
11
{
22
"learning_rate": {
33
"feasible_points": [
4-
0.001308209823469072
4+
0.000590120167916659
55
]
66
},
77
"beta1": {
88
"feasible_points": [
9-
0.9731333693827139
9+
0.737199286155609
1010
]
1111
},
1212
"beta2": {
1313
"feasible_points": [
14-
0.9981232922116359
14+
0.05919391544031072
1515
]
1616
},
1717
"warmup_steps": {
@@ -21,7 +21,7 @@
2121
},
2222
"weight_decay": {
2323
"feasible_points": [
24-
0.16375311233774334
24+
0.14128519778326312
2525
]
2626
}
2727
}
Lines changed: 5 additions & 5 deletions
Original file line numberDiff line numberDiff line change
@@ -1,27 +1,27 @@
11
{
22
"learning_rate": {
33
"feasible_points": [
4-
0.001308209823469072
4+
0.0014446807792420305
55
]
66
},
77
"beta1": {
88
"feasible_points": [
9-
0.9731333693827139
9+
0.7427148812902895
1010
]
1111
},
1212
"beta2": {
1313
"feasible_points": [
14-
0.9981232922116359
14+
0.8993064520764248
1515
]
1616
},
1717
"warmup_steps": {
1818
"feasible_points": [
19-
9999
19+
3000
2020
]
2121
},
2222
"weight_decay": {
2323
"feasible_points": [
24-
0.16375311233774334
24+
0.06875136511682291
2525
]
2626
}
2727
}
Lines changed: 5 additions & 5 deletions
Original file line numberDiff line numberDiff line change
@@ -1,27 +1,27 @@
11
{
22
"learning_rate": {
33
"feasible_points": [
4-
0.0035278622506232458
4+
0.0020162740358935045
55
]
66
},
77
"beta1": {
88
"feasible_points": [
9-
0.8192305396005781
9+
0.9604907112078142
1010
]
1111
},
1212
"beta2": {
1313
"feasible_points": [
14-
0.495850879212151
14+
0.8765457000160508
1515
]
1616
},
1717
"warmup_steps": {
1818
"feasible_points": [
19-
6000
19+
3600
2020
]
2121
},
2222
"weight_decay": {
2323
"feasible_points": [
24-
0.04339748256184769
24+
0.0006149579248633481
2525
]
2626
}
2727
}
Lines changed: 5 additions & 5 deletions
Original file line numberDiff line numberDiff line change
@@ -1,27 +1,27 @@
11
{
22
"learning_rate": {
33
"feasible_points": [
4-
0.001308209823469072
4+
0.0014446807792420305
55
]
66
},
77
"beta1": {
88
"feasible_points": [
9-
0.9731333693827139
9+
0.7427148812902895
1010
]
1111
},
1212
"beta2": {
1313
"feasible_points": [
14-
0.9981232922116359
14+
0.8993064520764248
1515
]
1616
},
1717
"warmup_steps": {
1818
"feasible_points": [
19-
6000
19+
1800
2020
]
2121
},
2222
"weight_decay": {
2323
"feasible_points": [
24-
0.16375311233774334
24+
0.06875136511682291
2525
]
2626
}
2727
}
Lines changed: 5 additions & 5 deletions
Original file line numberDiff line numberDiff line change
@@ -1,27 +1,27 @@
11
{
22
"learning_rate": {
33
"feasible_points": [
4-
0.003632312571224348
4+
0.003604759885558324
55
]
66
},
77
"beta1": {
88
"feasible_points": [
9-
0.9980088784197237
9+
0.9931094324430452
1010
]
1111
},
1212
"beta2": {
1313
"feasible_points": [
14-
0.9982275351621527
14+
0.9976871843749077
1515
]
1616
},
1717
"warmup_steps": {
1818
"feasible_points": [
19-
6000
19+
720
2020
]
2121
},
2222
"weight_decay": {
2323
"feasible_points": [
24-
0.2479797019098727
24+
0.120077307855989
2525
]
2626
}
2727
}

utils/workload_config.json renamed to utils/target_setting_workload_config.json

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -176,7 +176,7 @@
176176
"librispeech_conformer_attention_temperature": {
177177
"max_steps": 80000,
178178
"dataset": "librispeech",
179-
"submission_path": "reference_algorithms/target_setting_algorithms/jax_nadamw.py",
179+
"submission_path": "reference_algorithms/target_setting_algorithms/jax_adamw.py",
180180
"tuning_search_space": "reference_algorithms/target_setting_algorithms/librispeech_conformer_attention_temperature/tuning_search_space.json"
181181
},
182182
"librispeech_conformer_gelu": {

0 commit comments

Comments
 (0)