Skip to content

Commit f196311

Browse files
committed
fix: remove hardcoded GPU bind
1 parent 9b107a0 commit f196311

4 files changed

Lines changed: 4 additions & 4 deletions

File tree

training/DeepSpeed-SuperOffload/finetune_gpt-oss-20b_1gpu.sh

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -104,7 +104,7 @@ fi
104 104   # Set number of GPUs
105 105   GPUS_PER_NODE=1
106 106
107     - CMD="CUDA_VISIBLE_DEVICES=1 deepspeed --bind_cores_to_rank --bind_core_list 72-143 finetune_zero3.py \
    107 + CMD="deepspeed --num_gpus=$GPUS_PER_NODE finetune_zero3.py \
108 108   --deepspeed_config=$DS_CONFIG_JSON \
109 109   --model_name $MODEL_NAME \
110 110   --leaf_module "GptOssExperts" \

training/DeepSpeed-SuperOffload/finetune_llama-8b_1gpu.sh

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -103,7 +103,7 @@ fi
103 103
104 104   GPUS_PER_NODE=1
105 105
106     - CMD="CUDA_VISIBLE_DEVICES=1 deepspeed --bind_cores_to_rank --bind_core_list 72-143 finetune_zero3.py \
    106 + CMD="deepspeed --num_gpus=$GPUS_PER_NODE finetune_zero3.py \
107 107   --deepspeed_config=$DS_CONFIG_JSON \
108 108   --model_name $MODEL_NAME \
109 109   --num_train_epochs $EPOCHS \

training/DeepSpeed-SuperOffload/finetune_phi-4_1gpu.sh

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -103,7 +103,7 @@ fi
103 103
104 104   GPUS_PER_NODE=1
105 105
106     - CMD="CUDA_VISIBLE_DEVICES=1 deepspeed --bind_cores_to_rank --bind_core_list 72-143 finetune_zero3.py \
    106 + CMD="deepspeed --num_gpus=$GPUS_PER_NODE finetune_zero3.py \
107 107   --deepspeed_config=$DS_CONFIG_JSON \
108 108   --model_name $MODEL_NAME \
109 109   --num_train_epochs $EPOCHS \

training/DeepSpeed-SuperOffload/finetune_qwen3-14b_1gpu.sh

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -103,7 +103,7 @@ fi
103 103
104 104   GPUS_PER_NODE=1
105 105
106     - CMD="CUDA_VISIBLE_DEVICES=1 deepspeed --bind_cores_to_rank --bind_core_list 72-143 finetune_zero3.py \
    106 + CMD="deepspeed --num_gpus=$GPUS_PER_NODE finetune_zero3.py \
107 107   --deepspeed_config=$DS_CONFIG_JSON \
108 108   --model_name $MODEL_NAME \
109 109   --num_train_epochs $EPOCHS \

0 commit comments

Comments
 (0)