quantization2 / lm-quant-toolkit /scripts /debug-milp-low-bit.sh
chen459664's picture
Add files using upload-large-folder tool
2051791 verified
#!/bin/bash
# BUDGETS="2.13 2.25 2.51 3.13 3.25 3.51 4.13 4.25 4.51"
# BUDGETS="4.17 4.29 4.56 4.21 4.34 4.60"
# BUDGETS="4.09 4.46"
# BUDGETS="4.25"
# BUDGETS="3.12 3.25 3.51"
BUDGETS="4.25"
RESULT_DIR="/fdata/llm/mxq/results"
QUANT_SNAPSHOT_DIR="/fdata/llm/mxq/snapshots"
FACTOR=2
ATTEMPT="ts-lowbit-mix-sensi"
EXP_BASE_NAME=$ATTEMPT
mkdir -p $RESULT_DIR/$EXP_BASE_NAME/data/{ppl,qnt,stor}
# Use cached dataset to speedup wikitext, c4 ppl evaluation
export HF_DATASETS_OFFLINE=1
weight_algo=sensi-milp
log_file="logs/bench-${ATTEMPT}-$(date +%Y%m%d%H%M%S).log"
mkdir -p $QUANT_SNAPSHOT_DIR/$ATTEMPT
mkdir -p $RESULT_DIR/${EXP_NAME}_ppl
mkdir -p $RESULT_DIR/$EXP_BASE_NAME/data/{ppl,stor}/mxq/$ATTEMPT
# MODELS="0 1 2"
MODELS="0"
EXP_NAME="${ATTEMPT}"
echo "=========Run perplexity evaluation========="
# python ../src/cli.py llm \
python -m pdb ../src/cli.py llm \
--task eval_ppl \
--model $MODELS \
--algo mxq \
--weight-algo $weight_algo \
--factor $FACTOR \
--config ${BUDGETS} \
--experiment-name "${EXP_NAME}_ppl" \
--quant-snapshot-dir="$QUANT_SNAPSHOT_DIR/$ATTEMPT" \
--result-dir=$RESULT_DIR \
2>&1 \
| tee -a $log_file
EXIT_CODE=$?
if [ $EXIT_CODE -ne 0 ]; then
echo "Perplexity evaluation failed!"
exit $EXIT_CODE
fi