Skip to content

Commit 8528118

Browse files
committed
Change the dataset name from fineweb_edu_10B to finewebedu everywhere (matching the finewebedu_lm workload name) to maintain uniformity.
1 parent b21be29 commit 8528118

5 files changed

Lines changed: 6 additions & 6 deletions

File tree

.github/workflows/regression_tests.yml

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -116,7 +116,7 @@ jobs:
116116
- name: Run containerized workload
117117
run: |
118118
docker pull us-central1-docker.pkg.dev/training-algorithms-external/mlcommons-docker-repo/algoperf_jax_${{ github.head_ref || github.ref_name }}
119-
docker run -v $HOME/data/:/data/ -v $HOME/experiment_runs/:/experiment_runs -v $HOME/experiment_runs/logs:/logs --gpus all --ipc=host us-central1-docker.pkg.dev/training-algorithms-external/mlcommons-docker-repo/algoperf_jax_${{ github.head_ref || github.ref_name }} -d fineweb_edu_10B -f jax -s algorithms/archived_paper_baselines/adamw/jax/submission.py -w finewebedu_lm -t algorithms/archived_paper_baselines/adamw/tuning_search_space.json -e tests/regression_tests/adamw -m 10 -c False -o True -r false --data_bucket mlcommons-data --logs_bucket mlcommons-runs --data_bucket mlcommons-data --logs_bucket mlcommons-runs
119+
docker run -v $HOME/data/:/data/ -v $HOME/experiment_runs/:/experiment_runs -v $HOME/experiment_runs/logs:/logs --gpus all --ipc=host us-central1-docker.pkg.dev/training-algorithms-external/mlcommons-docker-repo/algoperf_jax_${{ github.head_ref || github.ref_name }} -d finewebedu -f jax -s algorithms/archived_paper_baselines/adamw/jax/submission.py -w finewebedu_lm -t algorithms/archived_paper_baselines/adamw/tuning_search_space.json -e tests/regression_tests/adamw -m 10 -c False -o True -r false --data_bucket mlcommons-data --logs_bucket mlcommons-runs --data_bucket mlcommons-data --logs_bucket mlcommons-runs
120120
fastmri_pytorch:
121121
runs-on: self-hosted
122122
needs: build_and_push_pytorch_docker_image
@@ -198,4 +198,4 @@ jobs:
198198
- name: Run containerized workload
199199
run: |
200200
docker pull us-central1-docker.pkg.dev/training-algorithms-external/mlcommons-docker-repo/algoperf_pytorch_${{ github.head_ref || github.ref_name }}
201-
docker run -v $HOME/data/:/data/ -v $HOME/experiment_runs/:/experiment_runs -v $HOME/experiment_runs/logs:/logs --gpus all --ipc=host us-central1-docker.pkg.dev/training-algorithms-external/mlcommons-docker-repo/algoperf_pytorch_${{ github.head_ref || github.ref_name }} -d fineweb_edu_10B -f pytorch -s algorithms/archived_paper_baselines/adamw/pytorch/submission.py -w finewebedu_lm -t algorithms/archived_paper_baselines/adamw/tuning_search_space.json -e tests/regression_tests/adamw -m 10 -c False -o True -r false --data_bucket mlcommons-data --logs_bucket mlcommons-runs --data_bucket mlcommons-data --logs_bucket mlcommons-runs
201+
docker run -v $HOME/data/:/data/ -v $HOME/experiment_runs/:/experiment_runs -v $HOME/experiment_runs/logs:/logs --gpus all --ipc=host us-central1-docker.pkg.dev/training-algorithms-external/mlcommons-docker-repo/algoperf_pytorch_${{ github.head_ref || github.ref_name }} -d finewebedu -f pytorch -s algorithms/archived_paper_baselines/adamw/pytorch/submission.py -w finewebedu_lm -t algorithms/archived_paper_baselines/adamw/tuning_search_space.json -e tests/regression_tests/adamw -m 10 -c False -o True -r false --data_bucket mlcommons-data --logs_bucket mlcommons-runs --data_bucket mlcommons-data --logs_bucket mlcommons-runs

dataset/dataset_setup.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -782,7 +782,7 @@ def download_finewebedu(
782782
):
783783
"""Download FineWebEdu-10B."""
784784

785-
data_dir = os.path.join(data_dir, 'fineweb_edu_10B')
785+
data_dir = os.path.join(data_dir, 'finewebedu')
786786
_maybe_mkdir(data_dir)
787787
_maybe_mkdir(tmp_dir)
788788

docker/scripts/startup.sh

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -174,7 +174,7 @@ fi
174174

175175
# Check if arguments are valid
176176
VALID_DATASETS=("criteo1tb" "imagenet" "fastmri" "ogbg" "librispeech" \
177-
"wmt" "mnist" "fineweb_edu_10B")
177+
"wmt" "mnist" "finewebedu")
178178
VALID_WORKLOADS=("criteo1tb" "imagenet_resnet" "imagenet_resnet_silu" "imagenet_resnet_gelu" \
179179
"imagenet_resnet_large_bn_init" "imagenet_vit" "imagenet_vit_glu" \
180180
"imagenet_vit_post_ln" "imagenet_vit_map" "fastmri" "ogbg" \

scoring/utils/slurm/make_job_config.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -67,7 +67,7 @@
6767
'librispeech_deepspeech': {'dataset': 'librispeech'},
6868
'criteo1tb': {'dataset': 'criteo1tb'},
6969
'librispeech_conformer': {'dataset': 'librispeech'},
70-
'finewebedu_lm': {'dataset': 'fineweb_edu_10B'},
70+
'finewebedu_lm': {'dataset': 'finewebedu'},
7171
}
7272

7373
RULESET_CONFIGS = {

scoring/utils/workload_metadata_external_tuning.json

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -33,6 +33,6 @@
3333
},
3434
"finewebedu_lm" : {
3535
"max_steps": 55000,
36-
"dataset":"fineweb_edu_10B"
36+
"dataset":"finewebedu"
3737
}
3838
}

0 commit comments

Comments
 (0)