#!/usr/bin/env bash
#
# For each base model listed in main():
#   1. run quantization_metric/main_fg.py to write a quantized copy of the
#      model under MODELS_ROOT,
#   2. run lm-evaluation-harness/run_scripts/eval_base_fg.sh on that copy,
#   3. delete the quantized copy,
#   4. print the elapsed wall-clock time.
#
# Usage: run from the directory that contains quantization_metric/ and
# lm-evaluation-harness/, or from inside one of those two directories.
#
# Environment:
#   CUDA_ID   value forwarded to main_fg.py --cuda_id (default: 6)
#   no_proxy  existing value is kept and extended with .byteintl.net

# No `set -e`: each step is checked explicitly so that a failure on one model
# does not prevent the next model from running.
set -uo pipefail

# Proxy and Hugging Face endpoint settings inherited by the child processes.
export HTTP_PROXY=http://sys-proxy-rd-relay.byted.org:8118
export http_proxy=http://sys-proxy-rd-relay.byted.org:8118
export https_proxy=http://sys-proxy-rd-relay.byted.org:8118
# Append to an existing list; emit no leading comma when no_proxy is unset/empty.
export no_proxy="${no_proxy:+${no_proxy},}.byteintl.net"
export HF_ENDPOINT=https://hf-mirror.com

readonly MODELS_ROOT=/mnt/bn/life-mllm/users/cxr/quantization/models
cuda_id="${CUDA_ID:-6}"
readonly cuda_id

# Print a message to stderr and abort the script.
die() {
  printf '%s\n' "$*" >&2
  exit 1
}

# Directory holding quantization_metric/ and lm-evaluation-harness/.
# Both the current directory and its parent are accepted so the script keeps
# working from either location.
if [[ -d quantization_metric ]]; then
  WORKSPACE=$PWD
elif [[ -d ../quantization_metric ]]; then
  WORKSPACE=$(cd .. && pwd) || die "cannot resolve parent directory"
else
  die "quantization_metric/ not found in . or .."
fi
readonly WORKSPACE

#######################################
# Quantize one model, evaluate it, remove the quantized copy, report timing.
# Globals:   MODELS_ROOT, WORKSPACE, cuda_id (read)
# Arguments: $1 - path of the base model (passed as --model_id)
#            $2 - tag passed as second argument to eval_base_fg.sh
#            $3 - value for --self_attn_layer_to_quant (space-separated list)
#            $4 - value for --mlp_layer_to_quant (space-separated list)
# Outputs:   "Execution time: <seconds> seconds" on stdout
# Returns:   0 on success, otherwise the status of the first failing step
#######################################
run_quant_eval() {
  local model_id=$1
  local save_fg=$2
  local self_attn_layer_to_quant=$3
  local mlp_layer_to_quant=$4
  local model="${MODELS_ROOT}/${model_id##*/}-quantization-fg"
  local start end runtime
  local status=0

  start=$(date +%s.%N)

  # Subshell: directory changes stay local, and the first failing step stops
  # the remaining ones (no evaluation of a model that was never written).
  (
    cd "${WORKSPACE}/quantization_metric" || exit
    python -u main_fg.py \
      --cuda_id "${cuda_id}" \
      --save_dir "${model}" \
      --model_id "${model_id}" \
      --self_attn_layer_to_quant "${self_attn_layer_to_quant}" \
      --mlp_layer_to_quant "${mlp_layer_to_quant}" || exit
    cd "${WORKSPACE}/lm-evaluation-harness" || exit
    bash run_scripts/eval_base_fg.sh "${model}" "${save_fg}"
  ) || status=$?

  # Always clean up the quantized copy; :? refuses to run on an empty path.
  rm -rf -- "${model:?}"

  end=$(date +%s.%N)
  # Pass the timestamps with -v instead of splicing them into the awk program.
  runtime=$(awk -v s="${start}" -v e="${end}" 'BEGIN { print e - s }')
  printf 'Execution time: %s seconds\n' "${runtime}"

  return "${status}"
}

main() {
  local rc=0

  # NOTE(review): this tag is "f6" while the Llama run uses "fg6" - possibly a
  # typo; kept unchanged, confirm against eval_base_fg.sh.
  run_quant_eval \
    "${MODELS_ROOT}/Qwen/Qwen2.5-7B" \
    f6 \
    "4 1 2 8 23 22 25 5 24 7 26 6 20 12 19 17 21 11 10 9 18" \
    "27 16 19" || rc=$?

  run_quant_eval \
    "${MODELS_ROOT}/meta-llama/Llama-3.1-8B" \
    fg6 \
    "29 23 24 30 18 28 26 20 16 27 25 17 19 21" \
    "26 20 22" || rc=$?

  return "${rc}"
}

main "$@"