#!/usr/bin/env bash
#
# Per-layer quantization sweep for Qwen2.5-14B.
#
# For each mode ("mlp", then "self_attn") and each layer index in
# [first_layer, last_layer], this script:
#   1. runs quantization_metric/main.py with --bit_layer_idx set to that
#      layer, saving the resulting model to a scratch directory;
#   2. runs lm-evaluation-harness/run_scripts/eval_base_qwen2_5_14b.sh on it,
#      tagging the run "<mode>_<idx>";
#   3. deletes the scratch directory before moving on to the next layer.
#
# Must be started from the directory that contains both
# quantization_metric/ and lm-evaluation-harness/ (all cd calls are relative).

# Outbound traffic goes through the relay proxy.
export HTTP_PROXY=http://sys-proxy-rd-relay.byted.org:8118
export http_proxy=http://sys-proxy-rd-relay.byted.org:8118
export https_proxy=http://sys-proxy-rd-relay.byted.org:8118
# Append to any existing no_proxy list; the ":+" form avoids a leading comma
# (an empty first entry) when no_proxy is unset or empty.
export no_proxy="${no_proxy:+${no_proxy},}.byteintl.net"
export HF_ENDPOINT=https://hf-mirror.com

cd quantization_metric/ || exit 1

model_id=/mnt/bn/life-mllm/users/cxr/quantization/models/Qwen/Qwen2.5-14B
model_name=$(basename "$model_id")
models_root=/mnt/bn/life-mllm/users/cxr/quantization/models
cuda_id=4

# Inclusive range of layer indices passed to main.py as --bit_layer_idx.
first_layer=32
last_layer=47

# Currently unused settings, kept for reference:
# output_dir=Alpha_values_mlp
# bit_layers_dir=/mnt/bn/life-mllm/users/cxr/quantization/quantization_metric/bit_layers
# result_dir=/mnt/bn/life-mllm/users/cxr/quantization/lm-evaluation-harness/results

#######################################
# Quantize and evaluate every layer in [first_layer, last_layer] for one mode.
# Globals:
#   model_id, cuda_id, first_layer, last_layer (read)
# Arguments:
#   $1 - mode passed to main.py via --mode (e.g. "mlp", "self_attn")
#   $2 - scratch directory the quantized model is saved to; it is removed
#        after every layer
# Outputs:
#   "<mode> <idx>" before each layer and the cumulative elapsed time (since
#   this sweep started) after each layer on stdout; warnings on stderr.
# Returns:
#   Exits the script with status 1 if a working directory cannot be entered.
#######################################
run_layer_sweep() {
  local mode=$1
  local save_dir=$2
  local idx sweep_start now elapsed

  sweep_start=$(date +%s.%N)

  for ((idx = first_layer; idx <= last_layer; idx++)); do
    printf '%s %s\n' "$mode" "$idx"

    cd ../quantization_metric || exit 1
    if python -u main.py \
      --bit_layer_idx "$idx" \
      --save_dir "$save_dir" \
      --mode "$mode" \
      --model_id "$model_id" \
      --cuda_id "$cuda_id"; then
      cd ../lm-evaluation-harness || exit 1
      bash run_scripts/eval_base_qwen2_5_14b.sh "$save_dir" "${mode}_${idx}" \
        || printf 'warning: evaluation failed for %s layer %s\n' \
          "$mode" "$idx" >&2
    else
      # Nothing valid to evaluate; keep going with the remaining layers.
      printf 'warning: quantization failed for %s layer %s; skipping eval\n' \
        "$mode" "$idx" >&2
    fi

    # ":?" aborts instead of running a bare "rm -rf" if save_dir is empty.
    rm -rf -- "${save_dir:?}"

    now=$(date +%s.%N)
    # Pass the timestamps with -v rather than splicing them into awk source.
    elapsed=$(awk -v s="$sweep_start" -v e="$now" 'BEGIN {print e - s}')
    echo "Execution time: $elapsed seconds"
  done
}

run_layer_sweep "mlp" "${models_root}/${model_name}-quantization-layer-mlp"
run_layer_sweep "self_attn" "${models_root}/${model_name}-quantization-layer"