File tree
4 files changed
+67
-25
lines changed- examples/models/llama
- source_transformation
- third-party
4 files changed
+67
-25
lines changedLines changed: 4 additions & 0 deletions
Original file line number | Diff line number | Diff line change | |
---|---|---|---|
| |||
412 | 412 |
| |
413 | 413 |
| |
414 | 414 |
| |
| 415 | + | |
| 416 | + | |
| 417 | + | |
| 418 | + | |
415 | 419 |
| |
416 | 420 |
| |
417 | 421 |
| |
|
Lines changed: 29 additions & 13 deletions
Original file line number | Diff line number | Diff line change | |
---|---|---|---|
| |||
155 | 155 |
| |
156 | 156 |
| |
157 | 157 |
| |
| 158 | + | |
| 159 | + | |
| 160 | + | |
| 161 | + | |
| 162 | + | |
158 | 163 |
| |
159 | 164 |
| |
160 | 165 |
| |
| |||
684 | 689 |
| |
685 | 690 |
| |
686 | 691 |
| |
| 692 | + | |
| 693 | + | |
| 694 | + | |
| 695 | + | |
| 696 | + | |
| 697 | + | |
| 698 | + | |
| 699 | + | |
| 700 | + | |
687 | 701 |
| |
688 | 702 |
| |
689 | 703 |
| |
| |||
1122 | 1136 |
| |
1123 | 1137 |
| |
1124 | 1138 |
| |
| 1139 | + | |
| 1140 | + | |
| 1141 | + | |
| 1142 | + | |
| 1143 | + | |
| 1144 | + | |
| 1145 | + | |
| 1146 | + | |
| 1147 | + | |
| 1148 | + | |
| 1149 | + | |
| 1150 | + | |
| 1151 | + | |
| 1152 | + | |
| 1153 | + | |
1125 | 1154 |
| |
1126 | 1155 |
| |
1127 | 1156 |
| |
| |||
1145 | 1174 |
| |
1146 | 1175 |
| |
1147 | 1176 |
| |
1148 |
| - | |
1149 |
| - | |
1150 |
| - | |
1151 |
| - | |
1152 |
| - | |
1153 |
| - | |
1154 |
| - | |
1155 |
| - | |
1156 |
| - | |
1157 |
| - | |
1158 |
| - | |
1159 |
| - | |
1160 |
| - | |
1161 | 1177 |
| |
1162 | 1178 |
| |
1163 | 1179 |
| |
|
Lines changed: 33 additions & 11 deletions
Original file line number | Diff line number | Diff line change | |
---|---|---|---|
| |||
124 | 124 |
| |
125 | 125 |
| |
126 | 126 |
| |
127 |
| - | |
128 |
| - | |
129 |
| - | |
| 127 | + | |
130 | 128 |
| |
131 | 129 |
| |
132 | 130 |
| |
| |||
786 | 784 |
| |
787 | 785 |
| |
788 | 786 |
| |
789 |
| - | |
| 787 | + | |
| 788 | + | |
| 789 | + | |
| 790 | + | |
| 791 | + | |
| 792 | + | |
| 793 | + | |
| 794 | + | |
| 795 | + | |
| 796 | + | |
| 797 | + | |
| 798 | + | |
| 799 | + | |
| 800 | + | |
| 801 | + | |
| 802 | + | |
790 | 803 |
| |
791 | 804 |
| |
792 |
| - | |
| 805 | + | |
| 806 | + | |
| 807 | + | |
793 | 808 |
| |
794 | 809 |
| |
795 | 810 |
| |
796 |
| - | |
797 |
| - | |
798 |
| - | |
799 |
| - | |
800 |
| - | |
801 |
| - | |
| 811 | + | |
| 812 | + | |
| 813 | + | |
| 814 | + | |
| 815 | + | |
| 816 | + | |
| 817 | + | |
| 818 | + | |
| 819 | + | |
| 820 | + | |
| 821 | + | |
| 822 | + | |
| 823 | + | |
802 | 824 |
| |
803 | 825 |
| |
804 | 826 |
| |
|
- .github/workflows/float8nocompile_test.yaml+29-29
- .github/workflows/torchao_experimental_test.yml+1-1
- examples/sam2_amg_server/compile_export_utils.py+3-2
- examples/sam2_vos_example/compile_export_utils.py+3-2
- torchao/dtypes/uintx/tensor_core_tiled_layout.py+1-1
- torchao/experimental/kernels/cpu/aarch64/embedding/embedding.h+58
- torchao/experimental/kernels/cpu/aarch64/linear/channelwise_8bit_activation_groupwise_lowbit_weight_1x1x32_f32_neondot-impl.h+22-75
- torchao/experimental/kernels/cpu/aarch64/linear/channelwise_8bit_activation_groupwise_lowbit_weight_1x4x16_f32_neondot-impl.h+19-148
- torchao/experimental/kernels/cpu/aarch64/linear/channelwise_8bit_activation_groupwise_lowbit_weight_1x8x16_f32_neondot-impl.h+19-149
- torchao/experimental/kernels/cpu/aarch64/linear/pack_weights.h+467
- torchao/experimental/kernels/cpu/aarch64/tests/CMakeLists.txt+9
- torchao/experimental/kernels/cpu/aarch64/tests/build_and_run_tests.sh+1
- torchao/experimental/kernels/cpu/aarch64/tests/test_embedding.cpp+60-1
- torchao/experimental/kernels/cpu/aarch64/tests/test_weight_packing.cpp+118
- torchao/experimental/ops/embedding_xbit/op_embedding_xbit-impl.h+119
- torchao/experimental/ops/embedding_xbit/op_embedding_xbit_aten.cpp+35-19
- torchao/experimental/ops/embedding_xbit/op_embedding_xbit_executorch.cpp+28
- torchao/experimental/ops/linear_8bit_act_xbit_weight/kernel_selector.h+1-63
- torchao/experimental/ops/linear_8bit_act_xbit_weight/packed_weights_format.h+75
- torchao/experimental/ops/mps/test/test_lowbit.py+2-1
- torchao/experimental/packed_linear_int8_dynamic_activation_intx_weight_layout.py+26-16
- torchao/experimental/quant_api.py+370-72
- torchao/experimental/tests/test_embedding_xbit_quantizer.py+129-28
0 commit comments