File tree
4 files changed
+67
-25
lines changed- examples/models/llama
- source_transformation
- third-party
4 files changed
+67
-25
lines changed| Original file line number | Diff line number | Diff line change | |
|---|---|---|---|
| |||
412 | 412 | | |
413 | 413 | | |
414 | 414 | | |
| 415 | + | |
| 416 | + | |
| 417 | + | |
| 418 | + | |
415 | 419 | | |
416 | 420 | | |
417 | 421 | | |
| |||
| Original file line number | Diff line number | Diff line change | |
|---|---|---|---|
| |||
161 | 161 | | |
162 | 162 | | |
163 | 163 | | |
| 164 | + | |
| 165 | + | |
| 166 | + | |
| 167 | + | |
| 168 | + | |
164 | 169 | | |
165 | 170 | | |
166 | 171 | | |
| |||
664 | 669 | | |
665 | 670 | | |
666 | 671 | | |
| 672 | + | |
| 673 | + | |
| 674 | + | |
| 675 | + | |
| 676 | + | |
| 677 | + | |
| 678 | + | |
| 679 | + | |
| 680 | + | |
667 | 681 | | |
668 | 682 | | |
669 | 683 | | |
| |||
1111 | 1125 | | |
1112 | 1126 | | |
1113 | 1127 | | |
| 1128 | + | |
| 1129 | + | |
| 1130 | + | |
| 1131 | + | |
| 1132 | + | |
| 1133 | + | |
| 1134 | + | |
| 1135 | + | |
| 1136 | + | |
| 1137 | + | |
| 1138 | + | |
| 1139 | + | |
| 1140 | + | |
| 1141 | + | |
| 1142 | + | |
1114 | 1143 | | |
1115 | 1144 | | |
1116 | 1145 | | |
| |||
1130 | 1159 | | |
1131 | 1160 | | |
1132 | 1161 | | |
1133 | | - | |
1134 | | - | |
1135 | | - | |
1136 | | - | |
1137 | | - | |
1138 | | - | |
1139 | | - | |
1140 | | - | |
1141 | | - | |
1142 | | - | |
1143 | | - | |
1144 | | - | |
1145 | | - | |
1146 | 1162 | | |
1147 | 1163 | | |
1148 | 1164 | | |
| |||
| Original file line number | Diff line number | Diff line change | |
|---|---|---|---|
| |||
105 | 105 | | |
106 | 106 | | |
107 | 107 | | |
108 | | - | |
109 | | - | |
110 | | - | |
| 108 | + | |
111 | 109 | | |
112 | 110 | | |
113 | 111 | | |
| |||
752 | 750 | | |
753 | 751 | | |
754 | 752 | | |
755 | | - | |
| 753 | + | |
| 754 | + | |
| 755 | + | |
| 756 | + | |
| 757 | + | |
| 758 | + | |
| 759 | + | |
| 760 | + | |
| 761 | + | |
| 762 | + | |
| 763 | + | |
| 764 | + | |
| 765 | + | |
| 766 | + | |
| 767 | + | |
| 768 | + | |
756 | 769 | | |
757 | 770 | | |
758 | | - | |
| 771 | + | |
| 772 | + | |
| 773 | + | |
759 | 774 | | |
760 | 775 | | |
761 | 776 | | |
762 | | - | |
763 | | - | |
764 | | - | |
765 | | - | |
766 | | - | |
767 | | - | |
| 777 | + | |
| 778 | + | |
| 779 | + | |
| 780 | + | |
| 781 | + | |
| 782 | + | |
| 783 | + | |
| 784 | + | |
| 785 | + | |
| 786 | + | |
| 787 | + | |
| 788 | + | |
| 789 | + | |
768 | 790 | | |
769 | 791 | | |
770 | 792 | | |
| |||
- .github/workflows/torchao_experimental_test.yml+1-1
- examples/sam2_amg_server/compile_export_utils.py+3-2
- examples/sam2_vos_example/compile_export_utils.py+3-2
- torchao/dtypes/uintx/tensor_core_tiled_layout.py+1-1
- torchao/experimental/kernels/cpu/aarch64/embedding/embedding.h+58
- torchao/experimental/kernels/cpu/aarch64/linear/channelwise_8bit_activation_groupwise_lowbit_weight_1x1x32_f32_neondot-impl.h+22-75
- torchao/experimental/kernels/cpu/aarch64/linear/channelwise_8bit_activation_groupwise_lowbit_weight_1x4x16_f32_neondot-impl.h+19-148
- torchao/experimental/kernels/cpu/aarch64/linear/channelwise_8bit_activation_groupwise_lowbit_weight_1x8x16_f32_neondot-impl.h+19-149
- torchao/experimental/kernels/cpu/aarch64/linear/pack_weights.h+467
- torchao/experimental/kernels/cpu/aarch64/tests/CMakeLists.txt+9
- torchao/experimental/kernels/cpu/aarch64/tests/build_and_run_tests.sh+1
- torchao/experimental/kernels/cpu/aarch64/tests/test_embedding.cpp+60-1
- torchao/experimental/kernels/cpu/aarch64/tests/test_weight_packing.cpp+118
- torchao/experimental/ops/embedding_xbit/op_embedding_xbit-impl.h+119
- torchao/experimental/ops/embedding_xbit/op_embedding_xbit_aten.cpp+35-19
- torchao/experimental/ops/embedding_xbit/op_embedding_xbit_executorch.cpp+28
- torchao/experimental/ops/linear_8bit_act_xbit_weight/kernel_selector.h+1-63
- torchao/experimental/ops/linear_8bit_act_xbit_weight/packed_weights_format.h+75
- torchao/experimental/ops/mps/test/test_lowbit.py+2-1
- torchao/experimental/packed_linear_int8_dynamic_activation_intx_weight_layout.py+26-16
- torchao/experimental/quant_api.py+370-72
- torchao/experimental/tests/test_embedding_xbit_quantizer.py+129-28
0 commit comments