From 5b59fa33cfd295e3d0f8ca6d1aa2fa268c6ae1f2 Mon Sep 17 00:00:00 2001 From: Jenia Jitsev Date: Mon, 22 Dec 2025 14:27:43 +0100 Subject: [PATCH 1/3] Update simple_jureca.sbatch Updating compute budget account to the active one, westai0066 --- eval/distributed/simple_jureca.sbatch | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/eval/distributed/simple_jureca.sbatch b/eval/distributed/simple_jureca.sbatch index 7c1cbfe7..7708d262 100644 --- a/eval/distributed/simple_jureca.sbatch +++ b/eval/distributed/simple_jureca.sbatch @@ -4,7 +4,7 @@ #SBATCH --gres=gpu:4 #SBATCH --time={time_limit} #SBATCH --cpus-per-task=12 -#SBATCH --account=westai0007 +#SBATCH --account=westai0066 #SBATCH --partition=dc-hwai #SBATCH --job-name={job_name} #SBATCH --output={logs_dir}/%x_%j.out @@ -25,4 +25,4 @@ OUTPUT_DATASET={output_dataset} # RUN SHARDED INFERENCE srun --output={logs_dir}/%x_%j_%t.out bash -c 'echo -e "GLOBAL_SIZE: ${SLURM_STEP_NUM_TASKS}\nRANK: ${SLURM_PROCID}\nMODEL: '$MODEL_NAME'\nINPUT_DATASET: '$INPUT_DATASET'\nOUTPUT_DATASET: '$OUTPUT_DATASET'"' -srun --output={logs_dir}/%x_%j_%t.out bash -c 'CUDA_VISIBLE_DEVICES=${SLURM_LOCALID} python $EVALCHEMY/eval/distributed/process_shard.py --global_size ${SLURM_STEP_NUM_TASKS} --rank ${SLURM_PROCID} --input_dataset '${INPUT_DATASET}' --model_name '${MODEL_NAME}' --output_dataset '${OUTPUT_DATASET}'' \ No newline at end of file +srun --output={logs_dir}/%x_%j_%t.out bash -c 'CUDA_VISIBLE_DEVICES=${SLURM_LOCALID} python $EVALCHEMY/eval/distributed/process_shard.py --global_size ${SLURM_STEP_NUM_TASKS} --rank ${SLURM_PROCID} --input_dataset '${INPUT_DATASET}' --model_name '${MODEL_NAME}' --output_dataset '${OUTPUT_DATASET}'' From 93b19d49f23fd37c48a512ae28f224a8252ee4fb Mon Sep 17 00:00:00 2001 From: Jenia Jitsev Date: Mon, 22 Dec 2025 14:31:31 +0100 Subject: [PATCH 2/3] Update process_shards_jureca.sbatch Updating compute budget on hwai to the active one, westai0066 --- eval/distributed/process_shards_jureca.sbatch | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/eval/distributed/process_shards_jureca.sbatch b/eval/distributed/process_shards_jureca.sbatch index 77772dc4..8c2825d1 100644 --- a/eval/distributed/process_shards_jureca.sbatch +++ b/eval/distributed/process_shards_jureca.sbatch @@ -5,7 +5,7 @@ #SBATCH --gres=gpu:1 #SBATCH --time=01:00:00 #SBATCH --cpus-per-task=12 -#SBATCH --account=westai0007 +#SBATCH --account=westai0066 #SBATCH --partition=dc-hwai # ENVIRONMENT VARIABLES @@ -23,4 +23,4 @@ export OUTPUT_DATASET="$DCFT_DATA/evalchemy_results/${MODEL_NAME##*--}_${INPUT_D # RUN SHARDED INFERENCE srun echo -e "GLOBAL_SIZE: ${GLOBAL_SIZE}\nRANK: ${RANK}\nMODEL: ${MODEL_NAME}\nINPUT_DATASET: ${INPUT_DATASET}\nOUTPUT_DATASET: ${OUTPUT_DATASET}" -srun python $EVALCHEMY/eval/distributed/process_shard.py --global_size ${GLOBAL_SIZE} --rank ${RANK} --input_dataset ${INPUT_DATASET} --model_name ${MODEL_NAME} --output_dataset ${OUTPUT_DATASET} \ No newline at end of file +srun python $EVALCHEMY/eval/distributed/process_shard.py --global_size ${GLOBAL_SIZE} --rank ${RANK} --input_dataset ${INPUT_DATASET} --model_name ${MODEL_NAME} --output_dataset ${OUTPUT_DATASET} From 84b34a529f69d94b4cfd2629fd2b9eb67329a01c Mon Sep 17 00:00:00 2001 From: Jenia Jitsev Date: Mon, 22 Dec 2025 14:32:15 +0100 Subject: [PATCH 3/3] Update SETUP_JURECA.md Updating compute budget on hwai to the active one, westai0066 --- eval/distributed/SETUP_JURECA.md | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/eval/distributed/SETUP_JURECA.md b/eval/distributed/SETUP_JURECA.md index 5b7ff462..e96a4825 100644 --- a/eval/distributed/SETUP_JURECA.md +++ b/eval/distributed/SETUP_JURECA.md @@ -88,7 +88,7 @@ huggingface-cli download mlfoundations-dev/evalset_2870 --repo-type dataset huggingface-cli download open-thoughts/OpenThinker-7B # Request an interactive node for testing -salloc --nodes=1 --ntasks-per-node=1 --gres=gpu:1 --cpus-per-task=12 -p dc-hwai -A westai0007 +salloc --nodes=1 --ntasks-per-node=1 --gres=gpu:1 --cpus-per-task=12 -p dc-hwai -A westai0066 # Verify GPU is available srun bash -c 'nvidia-smi'