# Created
# September 11, 2024 20:07
# -
# -
# Save HDCharles/0a484ef22083f11bb12dace8b58434a4 to your computer and use it in GitHub Desktop.
# This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
# Learn more about bidirectional Unicode characters
# Folder containing the model checkpoints. The path is relative, so it is
# resolved against the directory the commands are run from.
export CHECKPOINT_PATH=../../../checkpoints # path to checkpoints folder

# README EVALUATIONS
# Each command below runs eval.py on the checkpoint selected by MODEL_REPO with
# one quantization setting. The trailing comment on each line is the result
# recorded for that run (presumably perplexity -- TODO confirm the metric).
export MODEL_REPO=meta-llama/Llama-2-7b-chat-hf
python eval.py --checkpoint_path "${CHECKPOINT_PATH}/${MODEL_REPO}/model.pth" #12.212
python eval.py --checkpoint_path "${CHECKPOINT_PATH}/${MODEL_REPO}/model.pth" --quantization int8dq --compile #12.262
python eval.py --checkpoint_path "${CHECKPOINT_PATH}/${MODEL_REPO}/model.pth" --quantization int8wo #12.204
python eval.py --checkpoint_path "${CHECKPOINT_PATH}/${MODEL_REPO}/model.pth" --quantization fp6 --compile --precision float16 #12.369
python eval.py --checkpoint_path "${CHECKPOINT_PATH}/${MODEL_REPO}/model.pth" --quantization int4wo-64-hqq #12.825717540084083
python eval.py --checkpoint_path "${CHECKPOINT_PATH}/${MODEL_REPO}/model.pth" --quantization int4wo-64 #12.87233037343588
python eval.py --checkpoint_path "${CHECKPOINT_PATH}/${MODEL_REPO}/model.pth" --quantization int4wo-64-gptq #12.52718459353295
# Second README evaluation group: the same eval.py settings run against a
# different checkpoint. The trailing comment on each line is the result
# recorded for that run.
# NOTE(review): this export previously repeated meta-llama/Llama-2-7b-chat-hf,
# but the results recorded below differ from the Llama-2 runs of the identical
# commands and are in line with the Meta-Llama-3-8B runs elsewhere in this
# file, so Meta-Llama-3-8B is assumed to be the intended model -- confirm.
export MODEL_REPO=meta-llama/Meta-Llama-3-8B
python eval.py --checkpoint_path "${CHECKPOINT_PATH}/${MODEL_REPO}/model.pth" # 7.441690325135099
python eval.py --checkpoint_path "${CHECKPOINT_PATH}/${MODEL_REPO}/model.pth" --quantization int8wo #7.446656500265082
python eval.py --checkpoint_path "${CHECKPOINT_PATH}/${MODEL_REPO}/model.pth" --quantization int8dq --compile #7.580966566552427
python eval.py --checkpoint_path "${CHECKPOINT_PATH}/${MODEL_REPO}/model.pth" --quantization fp6 --compile --precision float16 #7.661
python eval.py --checkpoint_path "${CHECKPOINT_PATH}/${MODEL_REPO}/model.pth" --quantization int4wo-64-gptq #7.92162375549669
python eval.py --checkpoint_path "${CHECKPOINT_PATH}/${MODEL_REPO}/model.pth" --quantization int4wo-64-hqq #8.11014201472444
python eval.py --checkpoint_path "${CHECKPOINT_PATH}/${MODEL_REPO}/model.pth" --quantization int4wo-64 #8.316368680280947
# OTHER EVALUATIONS
# uintx HQQ quantization settings, compiled, run against two checkpoints.
# The trailing comment on each line is the result recorded for that run.
export MODEL_REPO=meta-llama/Llama-2-7b-chat-hf
python eval.py --checkpoint_path "${CHECKPOINT_PATH}/${MODEL_REPO}/model.pth" --quantization uintx-4-64-hqq --compile # 12.775
python eval.py --checkpoint_path "${CHECKPOINT_PATH}/${MODEL_REPO}/model.pth" --quantization uintx-2-8-hqq --compile # 24.500
export MODEL_REPO=meta-llama/Meta-Llama-3-8B
python eval.py --checkpoint_path "${CHECKPOINT_PATH}/${MODEL_REPO}/model.pth" --quantization uintx-4-64-hqq --compile # 8.124
python eval.py --checkpoint_path "${CHECKPOINT_PATH}/${MODEL_REPO}/model.pth" --quantization uintx-2-8-hqq --compile # 39.605
# Sign up for free
# to join this conversation on GitHub.
# Already have an account?
# Sign in to comment