#!/bin/bash
#
# Launches ${main_dir}/cli_sat.py through torchrun with a fixed set of model
# and generation flags. Any arguments given to this script are appended
# verbatim after the built-in flags.
#
# Usage: <this script> [extra cli_sat.py arguments...]
#
# Exit status: that of the torchrun invocation (it is the last command).

# Locate the directory one level above the directory holding this script;
# cli_sat.py is expected there. Quoted so paths with spaces survive.
script_path=$(realpath "$0")
script_dir=$(dirname "$script_path")
main_dir=$(dirname "$script_dir")

# Passed to torchrun as --nproc_per_node.
MP_SIZE=1

SEED=12345
MAX_GEN_LENGTH=128
MIN_GEN_LENGTH=0

# NOTE(review): these look like beam-search settings, yet the sampling
# strategy below is BaseStrategy — confirm they are still wanted.
NUM_BEAMS=4
LENGTH_PENALTY=1.0
NO_REPEAT_NGRAM=0

# Sampling settings forwarded as --temperature / --top_k / --top_p.
TEMP=0.8
TOPK=0
TOPP=0.9

# Passed to torchrun as --master_port.
PORT=19865

# Arrays (not flat strings) so every flag and value stays one exact word.
MODEL_ARGS=(
  --bf16
  --skip-init
  --mode finetune
  --rotary-embedding-2d
)

GENERATION_ARGS=(
  --seed "$SEED"
  --sampling-strategy BaseStrategy
  --max-gen-length "$MAX_GEN_LENGTH"
  --min-gen-length "$MIN_GEN_LENGTH"
  --num-beams "$NUM_BEAMS"
  --length-penalty "$LENGTH_PENALTY"
  --no-repeat-ngram-size "$NO_REPEAT_NGRAM"
  --multiline_stream
  --temperature "$TEMP"
  --top_k "$TOPK"
  --top_p "$TOPP"
)

# Environment assignments applied only to the torchrun process (via env).
OPTIONS_NCCL=(
  NCCL_DEBUG=VERSION
  NCCL_IB_DISABLE=0
  NCCL_NET_GDR_LEVEL=2
  CUDA_LAUNCH_BLOCKING=0
)

# "$@" keeps each user-supplied argument intact; the previous string + eval
# approach re-split and re-evaluated them.
run_cmd=(
  torchrun
  --nproc_per_node "$MP_SIZE"
  --master_port="$PORT"
  "${main_dir}/cli_sat.py"
  "${MODEL_ARGS[@]}"
  "${GENERATION_ARGS[@]}"
  "$@"
)

# Show the command line before running it.
printf '%s\n' "${OPTIONS_NCCL[*]} ${run_cmd[*]}"

# Run without eval. This is intentionally the last command so its exit status
# becomes the script's (the old trailing `set +x` always reset it to 0).
env "${OPTIONS_NCCL[@]}" "${run_cmd[@]}"