DeepSpeedExamples/MoQ/run.sh at master · DistributedDeepLearning/DeepSpeedExamples

42 lines (35 loc) · 768 Bytes

# Fine-tune bert-base-cased on GLUE tasks by launching run_glue.py through
# torch.distributed.launch with a DeepSpeed config, one task per iteration,
# one process per launch.
#
# Optional environment overrides:
#   OOO - root directory under which each task's output directory is created
#   GPU - value exported as CUDA_VISIBLE_DEVICES; also added to MASTER_PORT
#
# NOTE(review): the definitions of OOO and GPU are not visible in this copy of
# the script; the defaults below ("output" and 0) are assumptions -- confirm
# against the upstream file.
OOO=${OOO:-output}
GPU=${GPU:-0}
MASTER_PORT=12345

# Only the tasks before the '#' are run; the rest of the list is commented out
# and can be re-enabled by moving names in front of the '#'.
for TSK in qnli #stsb mrpc cola wnli sst2 rte qnli qqp mnli
do
  # wnli and mrpc train for 5 epochs, every other task for 3.
  if [[ "$TSK" == wnli || "$TSK" == mrpc ]]; then
    EPOCH_NUM=5
  else
    EPOCH_NUM=3
  fi

  # NOTE(review): TEST_JSON is selected per task, but the launch command below
  # passes the literal "test.json" to --deepspeed, so this value is currently
  # unused. If the per-task config was intended, replace the literal with
  # "$TEST_JSON" after confirming test_long.json exists.
  if [[ "$TSK" == qqp || "$TSK" == mnli ]]; then
    TEST_JSON=test_long.json
  else
    TEST_JSON=test.json
  fi

  # Derive the launcher port from the GPU value (presumably so runs pinned to
  # different GPUs do not share a port -- confirm).
  PORT=$((MASTER_PORT + GPU))

  # Remove any previous output for this task. ${OOO:?} aborts instead of
  # deleting "./<task>" if OOO is ever empty.
  rm -rvf -- "./${OOO:?}/${TSK}"

  CUDA_VISIBLE_DEVICES="$GPU" python -m torch.distributed.launch \
    --master_port "$PORT" \
    --nproc_per_node 1 run_glue.py \
    --model_name_or_path bert-base-cased \
    --task_name "$TSK" \
    --do_train \
    --do_eval \
    --max_seq_length 128 \
    --per_device_train_batch_size 32 \
    --learning_rate 2e-5 \
    --num_train_epochs "$EPOCH_NUM" \
    --output_dir "./$OOO/$TSK/" \
    --warmup_steps 2 \
    --deepspeed test.json
done

Provide feedback

Saved searches

Use saved searches to filter your results more quickly

FilesExpand file tree

run.sh

Latest commit

History

run.sh

File metadata and controls