diff --git a/docs/source/llm_recipes.md b/docs/source/llm_recipes.md index 5f04242516b..328bba3ba09 100644 --- a/docs/source/llm_recipes.md +++ b/docs/source/llm_recipes.md @@ -29,8 +29,8 @@ This document aims to publish the specific recipes we achieved for the popular L | databricks/dolly-v2-12b | ✖ | ✔ | ✖ | | EleutherAI/gpt-neox-20b | ✖ | ✔ | ✔ | | mistralai/Mistral-7B-v0.1 | ✖ | ✔ | ✔ | -| THUDM/chatglm2-6b | WIP | ✔ | ✔ | -| THUDM/chatglm3-6b | WIP | ✔ | ✔ | +| THUDM/chatglm2-6b | ✔ | ✔ | ✔ | +| THUDM/chatglm3-6b | WIP | ✔ | WIP | **Detail recipes can be found [HERE](https://github.com/intel/intel-extension-for-transformers/blob/main/examples/huggingface/pytorch/text-generation/quantization/llm_quantization_recipes.md).** @@ -40,8 +40,8 @@ This document aims to publish the specific recipes we achieved for the popular L > - The WIP recipes will be published soon. ## Large Language Models Accuracy -
| Model | lambada_openai | @@ -63,212 +63,210 @@ This document aims to publish the specific recipes we achieved for the popular LRatio | ACC | Ratio | -|||||||||||||
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| baichuan-inc/Baichuan-13B-Chat | 67.57% | -68.23% | -1.0098 | -67.57% | -1.0000 | -67.84% | -1.0040 | -NA | -NA | +69.07% | +1.0222 | +67.55% | +0.9997 | +68.12% | +1.0081 | +66.93% | +0.9905 |
| baichuan-inc/Baichuan2-13B-Chat | 71.51% | -70.89% | -0.9913 | -71.53% | -1.0003 | -71.76% | -1.0035 | -NA | -NA | +75.57% | +1.0568 | +71.57% | +1.0008 | +70.81% | +0.9902 | +N/A | +N/A |
| baichuan-inc/Baichuan2-7B-Chat | 67.67% | -67.96% | -1.0043 | -67.59% | -0.9988 | -67.24% | -0.9936 | -67.42% | -0.9963 | +68.06% | +1.0058 | +67.61% | +0.9991 | +67.90% | +1.0034 | +N/A | +N/A |
| bigscience/bloom-1b7 | 46.34% | 47.99% | 1.0356 | -46.38% | -1.0009 | -46.19% | -0.9968 | -NA | -NA | +46.21% | +0.9972 | +46.90% | +1.0121 | +N/A | +N/A | ||
| databricks/dolly-v2-12b | 64.35% | -NA | -NA | -64.10% | -0.9961 | -NA | -NA | -NA | -NA | +N/A | +N/A | +63.92% | +0.9933 | +N/A | +N/A | +N/A | +N/A |
| EleutherAI/gpt-j-6b | 68.31% | -68.33% | -1.0003 | -68.23% | -0.9988 | -68.79% | -1.0070 | -68.43% | -1.0018 | +68.27% | +0.9994 | +68.27% | +0.9994 | +68.35% | +1.0006 | +68.02% | +0.9958 |
| EleutherAI/gpt-neox-20b | 72.33% | -NA | -NA | -72.25% | -0.9989 | -71.96% | -0.9949 | -NA | -NA | +N/A | +N/A | +72.29% | +0.9994 | +71.74% | +0.9918 | +N/A | +N/A |
| facebook/opt-1.3b | 57.89% | -57.54% | -0.9940 | -58.08% | -1.0033 | -58.57% | -1.0117 | -NA | -NA | +57.68% | +0.9964 | +58.12% | +1.0040 | +58.26% | +1.0064 | +N/A | +N/A |
| facebook/opt-30b | 71.49% | -71.51% | -1.0003 | -71.51% | -1.0003 | -71.82% | -1.0046 | -72.11% | -1.0087 | +71.78% | +1.0041 | +71.53% | +1.0006 | +71.59% | +1.0014 | +71.80% | +1.0043 |
| meta-llama/Llama-2-13b-hf | 76.77% | 76.25% | 0.9932 | -76.75% | -0.9997 | -77.43% | -1.0086 | -76.75% | -0.9997 | +76.89% | +1.0016 | +77.66% | +1.0116 | +76.60% | +0.9978 | ||
| meta-llama/Llama-2-70b-hf | 79.64% | -79.55% | -0.9989 | -79.57% | -0.9991 | +79.14% | +0.9937 | +79.62% | +0.9997 | 80.09% | 1.0057 | -79.97% | -1.0041 | +79.68% | +1.0005 | ||
| meta-llama/Llama-2-7b-hf | 73.92% | 73.45% | 0.9936 | -73.96% | -1.0005 | -73.45% | -0.9936 | -73.49% | -0.9942 | +73.90% | +0.9997 | +73.84% | +0.9989 | +N/A | +N/A | ||
| mistralai/Mistral-7B-v0.1 | 75.90% | -NA | -NA | +N/A | +N/A | 75.80% | 0.9987 | -76.13% | -1.0030 | -75.61% | -0.9962 | +76.25% | +1.0046 | +75.74% | +0.9979 | ||
| THUDM/chatglm2-6b | 53.23% | -NA | -NA | -53.19% | -0.9992 | -52.77% | -0.9914 | -53.35% | -1.0023 | +52.86% | +0.9930 | +53.00% | +0.9957 | +52.90% | +0.9938 | +52.92% | +0.9942 |
| THUDM/chatglm3-6b | 59.09% | -NA | -NA | -59.01% | -0.9986 | -NA | -NA | -58.61% | -0.9919 | +N/A | +N/A | +59.03% | +0.9990 | +N/A | +N/A | +N/A | +N/A |
| tiiuae/falcon-40b | 77.22% | -77.04% | -0.9977 | -77.22% | -1.0000 | -77.94% | -1.0093 | -78.79% | -1.0203 | +76.95% | +0.9965 | +77.18% | +0.9995 | +77.55% | +1.0043 | +77.82% | +1.0078 |
| tiiuae/falcon-7b | 74.67% | -76.44% | -1.0237 | -74.77% | -1.0013 | -75.00% | -1.0044 | -NA | -NA | +76.63% | +1.0262 | +74.73% | +1.0008 | +75.06% | +1.0052 | +74.00% | +0.9910 |