Skip to content

Commit 00ea09a

Browse files
metascroy authored and liangel-02 committed
Move config out of experimental (#1954)
* init * up * up * up * up
1 parent ea50da4 commit 00ea09a

11 files changed

+597
-498
lines changed

.github/workflows/torchao_experimental_test.yml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -40,7 +40,7 @@ jobs:
4040
pip install numpy
4141
pip install pytest
4242
pip install parameterized
43-
USE_CPP=1 pip install .
43+
USE_CPP=1 TORCHAO_BUILD_KLEIDIAI=1 pip install .
4444
- name: Run python tests
4545
run: |
4646
conda activate venv

torchao/dtypes/__init__.py

Lines changed: 6 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -20,9 +20,12 @@
2020
MarlinQQQLayout,
2121
MarlinQQQTensor,
2222
MarlinSparseLayout,
23+
PackedLinearInt8DynamicActivationIntxWeightLayout,
24+
QDQLayout,
2325
SemiSparseLayout,
2426
TensorCoreTiledLayout,
2527
UintxLayout,
28+
to_affine_quantized_packed_linear_int8_dynamic_activation_intx_weight,
2629
to_marlinqqq_quantized_intx,
2730
)
2831
from .utils import (
@@ -54,4 +57,7 @@
5457
"Int4CPULayout",
5558
"CutlassInt4PackedLayout",
5659
"CutlassSemiSparseLayout",
60+
"QDQLayout",
61+
"PackedLinearInt8DynamicActivationIntxWeightLayout",
62+
"to_affine_quantized_packed_linear_int8_dynamic_activation_intx_weight",
5763
]

torchao/dtypes/affine_quantized_tensor_ops.py

Lines changed: 20 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -51,13 +51,25 @@
5151
_linear_fp_act_int4_weight_sparse_marlin_check,
5252
_linear_fp_act_int4_weight_sparse_marlin_impl,
5353
)
54+
from torchao.dtypes.uintx.packed_linear_int8_dynamic_activation_intx_weight_layout import (
55+
_linear_check as _linear_int8_act_intx_weight_packed_check,
56+
)
57+
from torchao.dtypes.uintx.packed_linear_int8_dynamic_activation_intx_weight_layout import (
58+
_linear_impl as _linear_int8_act_intx_weight_packed_impl,
59+
)
5460
from torchao.dtypes.uintx.plain_layout import (
5561
PlainAQTTensorImpl,
5662
_linear_fp_act_int8_weight_check,
5763
_linear_fp_act_int8_weight_impl,
5864
_linear_int8_act_int8_weight_check,
5965
_linear_int8_act_int8_weight_impl,
6066
)
67+
from torchao.dtypes.uintx.q_dq_layout import (
68+
_linear_check as _linear_q_dq_check,
69+
)
70+
from torchao.dtypes.uintx.q_dq_layout import (
71+
_linear_impl as _linear_q_dq_impl,
72+
)
6173
from torchao.dtypes.uintx.semi_sparse_layout import (
6274
_linear_int8_act_int8_weight_semi_structured_sparse_check,
6375
_linear_int8_act_int8_weight_semi_structured_sparse_impl,
@@ -199,6 +211,14 @@ def _register_aqt_quantized_linear_dispatches():
199211
_linear_fp_act_uint4_weight_cpu_check,
200212
_linear_fp_act_uint4_weight_cpu_impl,
201213
),
214+
(
215+
_linear_int8_act_intx_weight_packed_check,
216+
_linear_int8_act_intx_weight_packed_impl,
217+
),
218+
(
219+
_linear_q_dq_check,
220+
_linear_q_dq_impl,
221+
),
202222
]:
203223
register_aqt_quantized_linear_dispatch(dispatch_condition, impl)
204224

torchao/dtypes/uintx/__init__.py

Lines changed: 10 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -15,6 +15,13 @@
1515
from .marlin_sparse_layout import (
1616
MarlinSparseLayout,
1717
)
18+
from .packed_linear_int8_dynamic_activation_intx_weight_layout import (
19+
PackedLinearInt8DynamicActivationIntxWeightLayout,
20+
to_affine_quantized_packed_linear_int8_dynamic_activation_intx_weight,
21+
)
22+
from .q_dq_layout import (
23+
QDQLayout,
24+
)
1825
from .semi_sparse_layout import (
1926
SemiSparseLayout,
2027
)
@@ -36,4 +43,7 @@
3643
"MarlinQQQTensor",
3744
"to_marlinqqq_quantized_intx",
3845
"CutlassInt4PackedLayout",
46+
"to_affine_quantized_packed_linear_int8_dynamic_activation_intx_weight",
47+
"PackedLinearInt8DynamicActivationIntxWeightLayout",
48+
"QDQLayout",
3949
]

0 commit comments

Comments
 (0)