| #!/bin/bash |
|
|
| script_path=$(realpath $0) |
| script_dir=$(dirname $script_path) |
| main_dir=$(dirname $script_dir) |
|
|
| MP_SIZE=1 |
| |
| |
|
|
|
|
| SEED=12345 |
| MAX_GEN_LENGTH=128 |
| MIN_GEN_LENGTH=0 |
|
|
| |
| NUM_BEAMS=4 |
| LENGTH_PENALTY=1.0 |
| NO_REPEAT_NGRAM=0 |
|
|
| |
| TEMP=0.8 |
| TOPK=0 |
| TOPP=0.9 |
|
|
|
|
| PORT=19865 |
|
|
| MODEL_ARGS="--bf16 \ |
| --skip-init \ |
| --mode finetune \ |
| --rotary-embedding-2d" |
|
|
| |
|
|
| GENERATION_ARGS="--seed $SEED \ |
| --sampling-strategy BaseStrategy \ |
| --max-gen-length $MAX_GEN_LENGTH \ |
| --min-gen-length $MIN_GEN_LENGTH \ |
| --num-beams $NUM_BEAMS \ |
| --length-penalty $LENGTH_PENALTY \ |
| --no-repeat-ngram-size $NO_REPEAT_NGRAM \ |
| --multiline_stream \ |
| --temperature $TEMP \ |
| --top_k $TOPK \ |
| --top_p $TOPP |
| " |
| |
| |
|
|
|
|
| OPTIONS_NCCL="NCCL_DEBUG=VERSION NCCL_IB_DISABLE=0 NCCL_NET_GDR_LEVEL=2 CUDA_LAUNCH_BLOCKING=0" |
|
|
| ARGS="${main_dir}/cli_sat.py \ |
| $MODEL_ARGS \ |
| $GENERATION_ARGS \ |
| $*" |
|
|
| run_cmd="${OPTIONS_NCCL} torchrun --nproc_per_node $MP_SIZE --master_port=$PORT ${ARGS}" |
| echo ${run_cmd} |
| eval ${run_cmd} |
| set +x |