File tree Expand file tree Collapse file tree
training/DeepSpeed-SuperOffload Expand file tree Collapse file tree Original file line number Diff line number Diff line change 104104# Set number of GPUs
105105GPUS_PER_NODE=1
106106
107- CMD=" CUDA_VISIBLE_DEVICES=1 deepspeed --bind_cores_to_rank --bind_core_list 72-143 finetune_zero3.py \
107+ CMD=" deepspeed --num_gpus= $GPUS_PER_NODE finetune_zero3.py \
108108 --deepspeed_config=$DS_CONFIG_JSON \
109109 --model_name $MODEL_NAME \
110110 --leaf_module " GptOssExperts" \
Original file line number Diff line number Diff line change 103103
104104GPUS_PER_NODE=1
105105
106- CMD=" CUDA_VISIBLE_DEVICES=1 deepspeed --bind_cores_to_rank --bind_core_list 72-143 finetune_zero3.py \
106+ CMD=" deepspeed --num_gpus= $GPUS_PER_NODE finetune_zero3.py \
107107 --deepspeed_config=$DS_CONFIG_JSON \
108108 --model_name $MODEL_NAME \
109109 --num_train_epochs $EPOCHS \
Original file line number Diff line number Diff line change 103103
104104GPUS_PER_NODE=1
105105
106- CMD=" CUDA_VISIBLE_DEVICES=1 deepspeed --bind_cores_to_rank --bind_core_list 72-143 finetune_zero3.py \
106+ CMD=" deepspeed --num_gpus= $GPUS_PER_NODE finetune_zero3.py \
107107 --deepspeed_config=$DS_CONFIG_JSON \
108108 --model_name $MODEL_NAME \
109109 --num_train_epochs $EPOCHS \
Original file line number Diff line number Diff line change 103103
104104GPUS_PER_NODE=1
105105
106- CMD=" CUDA_VISIBLE_DEVICES=1 deepspeed --bind_cores_to_rank --bind_core_list 72-143 finetune_zero3.py \
106+ CMD=" deepspeed --num_gpus= $GPUS_PER_NODE finetune_zero3.py \
107107 --deepspeed_config=$DS_CONFIG_JSON \
108108 --model_name $MODEL_NAME \
109109 --num_train_epochs $EPOCHS \
You can’t perform that action at this time.
0 commit comments