# Spaces: Running on Zero
# Launch a training script through `accelerate launch`.
#
# Usage: <this script> FILE CONFIG_FILE TAG [extra script args...]
#   FILE         training script handed to `accelerate launch`
#   CONFIG_FILE  value passed to the training script as --config_file
#   TAG          value passed to the training script as --tag
#   extra args   forwarded verbatim to the training script
set -eu

# ---- Cluster layout: edit these for your environment ----
NUM_MACHINES=1
NUM_LOCAL_GPUS=8
MACHINE_RANK=0

MAIN_MACHINE_IP=""    # fill your machine IP here
MAIN_MACHINE_PORT=""  # fill your machine port here

# All three positional arguments are required; fail early instead of
# launching with an empty script path.
if [ "$#" -lt 3 ]; then
  printf 'Usage: %s FILE CONFIG_FILE TAG [extra script args...]\n' "$0" >&2
  exit 2
fi

FILE=$1
CONFIG_FILE=$2
TAG=$3
shift 3  # remove $1~$3 so that "$@" holds only the extra script args

# A multi-machine run cannot rendezvous without the main machine's address.
if [ "$NUM_MACHINES" -gt 1 ]; then
  if [ -z "$MAIN_MACHINE_IP" ] || [ -z "$MAIN_MACHINE_PORT" ]; then
    printf 'error: set MAIN_MACHINE_IP and MAIN_MACHINE_PORT when NUM_MACHINES > 1\n' >&2
    exit 2
  fi
fi

# export HF_ENDPOINT=https://hf-mirror.com
export HF_HOME="$HOME/.cache/huggingface"
export TORCH_HOME="$HOME/.cache/torch"
export NCCL_DEBUG=VERSION

# Rebuild the positional parameters as the tail of the launch command:
# the script path, its fixed flags, then the caller's extra arguments.
set -- "$FILE" \
  --config_file "$CONFIG_FILE" \
  --tag "$TAG" \
  --pin_memory \
  --allow_tf32 \
  "$@"

# Prepend the rendezvous options only when they are filled in; an empty value
# would make the flag swallow the next token as its argument.
if [ -n "$MAIN_MACHINE_PORT" ]; then
  set -- --main_process_port "$MAIN_MACHINE_PORT" "$@"
fi
if [ -n "$MAIN_MACHINE_IP" ]; then
  set -- --main_process_ip "$MAIN_MACHINE_IP" "$@"
fi

# Total process count is machines x GPUs per machine.
accelerate launch \
  --num_machines "$NUM_MACHINES" \
  --num_processes "$(( NUM_MACHINES * NUM_LOCAL_GPUS ))" \
  --machine_rank "$MACHINE_RANK" \
  "$@"