Skip to content

Commit 6c3e1aa

Browse files
committed
milestone1: naive_intNwo + eval/benchmark
1 parent 5787e9e commit 6c3e1aa

File tree

12 files changed

+848
-0
lines changed

12 files changed

+848
-0
lines changed
Lines changed: 22 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,22 @@
#!/bin/bash
#
# Per-layer sensitivity sweep.
#
# For every layer index 0..31, launches scripts/sensitivity_study.py once per
# entry of CONFIGS1 (passed as --quantization), with CUDA_VISIBLE_DEVICES set
# to the GPU at the same array index. All runs for one layer execute in
# parallel; the next layer starts only after all of them have exited.
# Combined stdout/stderr of each run is written to
# Sensi_<layer>_<quantization>.txt in the current directory.
#
# Exit status: 0 if every run succeeded, 1 if any run failed or the
# GPU/config lists are inconsistent.
#
# `set -e` is deliberately not used: one failing run must not abort the rest
# of the sweep. Failures are collected and reported at the end instead.

GPUS=(0 1 2 3 4 5)

CONFIGS1=("2" "3" "4" "5" "6" "8")

PYTHON_SCRIPT="scripts/sensitivity_study.py"
REPO_ID="checkpoints/meta-llama/Meta-Llama-3-8B"

# Config i runs on GPU i, so there must be a GPU for every config. Without
# this guard a surplus config would be launched with an empty
# CUDA_VISIBLE_DEVICES value.
if (( ${#CONFIGS1[@]} > ${#GPUS[@]} )); then
  echo "error: ${#CONFIGS1[@]} configs but only ${#GPUS[@]} GPUs" >&2
  exit 1
fi

failed=0

for LAYER in {0..31}; do
  pids=()
  logs=()

  # Iterate over the configs (not the GPUs) so that a GPU without a matching
  # config is left idle instead of running with an empty --quantization.
  for i in "${!CONFIGS1[@]}"; do
    GPU="${GPUS[$i]}"
    CONFIG1="${CONFIGS1[$i]}"

    LOG_FILE="Sensi_${LAYER}_${CONFIG1}.txt"

    CUDA_VISIBLE_DEVICES="$GPU" python "$PYTHON_SCRIPT" \
      --repo_id="$REPO_ID" \
      --quantization="$CONFIG1" \
      --layer="$LAYER" &>"$LOG_FILE" &
    pids+=("$!")
    logs+=("$LOG_FILE")
  done

  # A bare `wait` always returns 0; waiting on each PID exposes the exit
  # status of every individual run.
  for k in "${!pids[@]}"; do
    if ! wait "${pids[$k]}"; then
      echo "error: run failed, see ${logs[$k]}" >&2
      failed=$((failed + 1))
    fi
  done
done

echo "All processes are complete."

if (( failed > 0 )); then
  echo "error: ${failed} run(s) exited with a non-zero status" >&2
  exit 1
fi
Lines changed: 30 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,30 @@
#!/bin/bash
#
# Mixed-precision evaluation sweep.
#
# Launches scripts/mp_quant_eval.py once per (CONFIGS1[i], CONFIGS2[i]) pair,
# passed as --sensi_bit / --non_sensi_bit, with CUDA_VISIBLE_DEVICES set to
# GPUS[i]. All runs execute in parallel. Combined stdout/stderr of each run
# is written to MP_<sensi_bit>_<non_sensi_bit>.txt in the current directory.
#
# Exit status: 0 if every run succeeded, 1 if any run failed or the
# GPU/config lists are inconsistent.
#
# `set -e` is deliberately not used: one failing run must not abort the
# others. Failures are collected and reported at the end instead.

# List of GPUs to use
GPUS=(0 1 2 3 4 5)

# Bit-width pairs: CONFIGS1[i] is --sensi_bit, CONFIGS2[i] is --non_sensi_bit
CONFIGS1=(8 8 8 8 8 16)
CONFIGS2=(6 5 4 3 2 8)

#CONFIGS1=(16 16 16 16 16)
#CONFIGS2=(6 5 4 3 2)

#CONFIGS1=(5 5 5 6 6 6 6 3)
#CONFIGS2=(4 3 2 5 4 3 2 2)

PYTHON_SCRIPT="scripts/mp_quant_eval.py"
REPO_ID="checkpoints/meta-llama/Meta-Llama-3-8B"

# The two config lists are consumed pairwise, so they must line up.
if (( ${#CONFIGS1[@]} != ${#CONFIGS2[@]} )); then
  echo "error: CONFIGS1 has ${#CONFIGS1[@]} entries but CONFIGS2 has ${#CONFIGS2[@]}" >&2
  exit 1
fi

# Pair i runs on GPU i, so there must be a GPU for every pair. Without this
# guard a longer config list would be truncated or run without a GPU.
if (( ${#CONFIGS1[@]} > ${#GPUS[@]} )); then
  echo "error: ${#CONFIGS1[@]} configs but only ${#GPUS[@]} GPUs" >&2
  exit 1
fi

pids=()
logs=()

# Iterate over the configs (not the GPUs) so that a GPU without a matching
# config is left idle instead of running with empty bit-width arguments.
for i in "${!CONFIGS1[@]}"; do
  GPU="${GPUS[$i]}"
  CONFIG1="${CONFIGS1[$i]}"
  CONFIG2="${CONFIGS2[$i]}"

  LOG_FILE="MP_${CONFIG1}_${CONFIG2}.txt"

  CUDA_VISIBLE_DEVICES="$GPU" python "$PYTHON_SCRIPT" \
    --repo_id="$REPO_ID" \
    --quantization=MP_llama3 \
    --sensi_bit="$CONFIG1" \
    --non_sensi_bit="$CONFIG2" &>"$LOG_FILE" &
  pids+=("$!")
  logs+=("$LOG_FILE")
done

# A bare `wait` always returns 0; waiting on each PID exposes the exit status
# of every individual run.
failed=0
for k in "${!pids[@]}"; do
  if ! wait "${pids[$k]}"; then
    echo "error: run failed, see ${logs[$k]}" >&2
    failed=$((failed + 1))
  fi
done

echo "All processes are complete."

if (( failed > 0 )); then
  echo "error: ${failed} run(s) exited with a non-zero status" >&2
  exit 1
fi
Lines changed: 9 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,9 @@
#!/bin/bash
#
# Mixed-precision generation benchmark.
#
# Runs scripts/generate.py sequentially, once per
# (SENSI_BITS[i], NON_SENSI_BITS[i]) pair, with --compile and
# --quantization=MP_llama3. Every run is given the same --write_result path.
#
# Exit status: 0 if every run succeeded, 1 otherwise. A failing run does not
# stop the remaining runs.

PYTHON_SCRIPT="scripts/generate.py"
CHECKPOINT_PATH="checkpoints/meta-llama/Meta-Llama-3-8B/model.pth"
RESULT_FILE="mp_quant_benchmark_results.txt"

# Bit-width pairs to benchmark, consumed pairwise by index.
SENSI_BITS=(5 4 5)
NON_SENSI_BITS=(4 3 3)

if (( ${#SENSI_BITS[@]} != ${#NON_SENSI_BITS[@]} )); then
  echo "error: SENSI_BITS and NON_SENSI_BITS differ in length" >&2
  exit 1
fi

failed=0

for i in "${!SENSI_BITS[@]}"; do
  sensi_bit="${SENSI_BITS[$i]}"
  non_sensi_bit="${NON_SENSI_BITS[$i]}"

  if ! python "$PYTHON_SCRIPT" \
    --checkpoint_path="$CHECKPOINT_PATH" \
    --compile \
    --quantization=MP_llama3 \
    --sensi_bit="$sensi_bit" \
    --non_sensi_bit="$non_sensi_bit" \
    --write_result "$RESULT_FILE"; then
    echo "error: benchmark failed for sensi_bit=${sensi_bit} non_sensi_bit=${non_sensi_bit}" >&2
    failed=$((failed + 1))
  fi
done

echo "All processes are complete."

if (( failed > 0 )); then
  echo "error: ${failed} run(s) exited with a non-zero status" >&2
  exit 1
fi
Lines changed: 26 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,26 @@
#!/bin/bash
#
# Per-linear-type sensitivity sweep.
#
# For every entry of CONFIGS1 (passed as --linear_type), launches
# scripts/sensitivity_study.py once per entry of CONFIGS2 (passed as
# --quantization), with CUDA_VISIBLE_DEVICES set to the GPU at the same index
# as the CONFIGS2 entry. All runs for one linear type execute in parallel;
# the next linear type starts only after all of them have exited.
# Combined stdout/stderr of each run is written to
# Sensi_skipsensi_<linear_type>_<quantization>.txt in the current directory.
#
# Exit status: 0 if every run succeeded, 1 if any run failed or the
# GPU/config lists are inconsistent.
#
# `set -e` is deliberately not used: one failing run must not abort the rest
# of the sweep. Failures are collected and reported at the end instead.

CONFIGS1=("q_proj" "k_proj" "v_proj" "o_proj" "gate_proj" "up_proj" "down_proj")
CONFIGS2=("2" "3" "4" "5" "6" "8")

PYTHON_SCRIPT="scripts/sensitivity_study.py"
REPO_ID="checkpoints/meta-llama/Meta-Llama-3-8B"

GPUS=(0 1 2 3 4 5)

# Quantization j runs on GPU j, so there must be a GPU for every entry of
# CONFIGS2. Without this guard a surplus entry would be launched with an
# empty CUDA_VISIBLE_DEVICES value.
if (( ${#CONFIGS2[@]} > ${#GPUS[@]} )); then
  echo "error: ${#CONFIGS2[@]} quantization configs but only ${#GPUS[@]} GPUs" >&2
  exit 1
fi

failed=0

for i in "${!CONFIGS1[@]}"; do
  CONFIG1="${CONFIGS1[$i]}"
  pids=()
  logs=()

  for j in "${!CONFIGS2[@]}"; do
    CONFIG2="${CONFIGS2[$j]}"
    GPU="${GPUS[$j]}"

    LOG_FILE="Sensi_skipsensi_${CONFIG1}_${CONFIG2}.txt"

    CUDA_VISIBLE_DEVICES="$GPU" python "$PYTHON_SCRIPT" \
      --repo_id="$REPO_ID" \
      --quantization="$CONFIG2" \
      --linear_type="$CONFIG1" &>"$LOG_FILE" &
    pids+=("$!")
    logs+=("$LOG_FILE")
  done

  # A bare `wait` always returns 0; waiting on each PID exposes the exit
  # status of every individual run.
  for k in "${!pids[@]}"; do
    if ! wait "${pids[$k]}"; then
      echo "error: run failed, see ${logs[$k]}" >&2
      failed=$((failed + 1))
    fi
  done
done

echo "All processes are complete."

if (( failed > 0 )); then
  echo "error: ${failed} run(s) exited with a non-zero status" >&2
  exit 1
fi
Lines changed: 39 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,39 @@
#!/bin/bash
#
# Uniform quantization evaluation sweep (symmetric, then asymmetric).
#
# Runs two passes over CONFIGS1. In each pass scripts/mx_eval.py is launched
# once per entry (passed as --quantization), with CUDA_VISIBLE_DEVICES set to
# the GPU at the same array index, all in parallel. The first pass uses
# --quant_sym=sym and logs to UNI_<quantization>_SYM.txt; the second pass
# starts after the first has finished, uses --quant_sym=asym and logs to
# UNI_<quantization>_ASYM.txt.
#
# Exit status: 0 if every run succeeded, 1 if any run failed or the
# GPU/config lists are inconsistent.
#
# `set -e` is deliberately not used: one failing run must not abort the
# others. Failures are collected and reported at the end instead.

# List of GPUs to use
GPUS=(2 3 4 5 6 7)

# List of configuration files
#CONFIGS1=("int6wo" "int5wo" "int2wo" "int3wo" "int8wo" "int4wo" "None" "autoquant")
CONFIGS1=("2" "3" "4" "5" "6" "8")
#CONFIGS1=(8 8 8 8 8 4 4 16)
#CONFIGS2=(6 5 4 3 2 3 2 8)

#CONFIGS1=(16 16 16 16 16)
#CONFIGS2=(6 5 4 3 2)

PYTHON_SCRIPT="scripts/mx_eval.py"
REPO_ID="checkpoints/meta-llama/Meta-Llama-3-8B"

# Config i runs on GPU i, so there must be a GPU for every config. Without
# this guard a longer config list would be truncated or run without a GPU.
if (( ${#CONFIGS1[@]} > ${#GPUS[@]} )); then
  echo "error: ${#CONFIGS1[@]} configs but only ${#GPUS[@]} GPUs" >&2
  exit 1
fi

failed=0

#######################################
# Launch one parallel pass over CONFIGS1 and wait for it to finish.
# Globals:   GPUS, CONFIGS1, PYTHON_SCRIPT, REPO_ID (read); failed (written)
# Arguments: $1 - value passed to --quant_sym
#            $2 - tag used in the log file name (UNI_<quantization>_<tag>.txt)
# Outputs:   one log file per run; an error line on stderr per failed run
#######################################
run_pass() {
  local quant_sym=$1
  local log_tag=$2
  local -a pids=()
  local -a logs=()
  local i k gpu config log_file

  # Iterate over the configs (not the GPUs) so that a GPU without a matching
  # config is left idle instead of running with an empty --quantization.
  for i in "${!CONFIGS1[@]}"; do
    gpu="${GPUS[$i]}"
    config="${CONFIGS1[$i]}"
    log_file="UNI_${config}_${log_tag}.txt"

    CUDA_VISIBLE_DEVICES="$gpu" python "$PYTHON_SCRIPT" \
      --repo_id="$REPO_ID" \
      --quantization="$config" \
      --quant_sym="$quant_sym" &>"$log_file" &
    pids+=("$!")
    logs+=("$log_file")
  done

  # A bare `wait` always returns 0; waiting on each PID exposes the exit
  # status of every individual run.
  for k in "${!pids[@]}"; do
    if ! wait "${pids[$k]}"; then
      echo "error: run failed, see ${logs[$k]}" >&2
      failed=$((failed + 1))
    fi
  done
}

run_pass sym SYM
run_pass asym ASYM

echo "All processes are complete."

if (( failed > 0 )); then
  echo "error: ${failed} run(s) exited with a non-zero status" >&2
  exit 1
fi
Lines changed: 10 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,10 @@
#!/bin/bash
#
# Uniform quantization generation benchmark.
#
# Runs scripts/generate.py sequentially with --compile, once per entry of
# QUANTIZATIONS (passed as --quantization). Every run is given the same
# --write_result path.
#
# Exit status: 0 if every run succeeded, 1 otherwise. A failing run does not
# stop the remaining runs.

PYTHON_SCRIPT="scripts/generate.py"
CHECKPOINT_PATH="checkpoints/meta-llama/Meta-Llama-3-8B/model.pth"
RESULT_FILE="uni_quant_benchmark_results.txt"

# Values passed to --quantization, in execution order.
QUANTIZATIONS=("int4wo" "int8wo" "2" "3" "5" "6")

failed=0

for quantization in "${QUANTIZATIONS[@]}"; do
  if ! python "$PYTHON_SCRIPT" \
    --checkpoint_path="$CHECKPOINT_PATH" \
    --compile \
    --quantization="$quantization" \
    --write_result "$RESULT_FILE"; then
    echo "error: benchmark failed for quantization=${quantization}" >&2
    failed=$((failed + 1))
  fi
done

echo "All processes are complete."

if (( failed > 0 )); then
  echo "error: ${failed} run(s) exited with a non-zero status" >&2
  exit 1
fi

0 commit comments

Comments
 (0)