Skip to content

Commit fac758a

Browse files
Add WOQ int8 test with Inductor Freeze
1 parent ff42c85 commit fac758a

File tree

1 file changed

+7
-0
lines changed

1 file changed

+7
-0
lines changed

test/integration/test_integration.py

Lines changed: 7 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -1046,6 +1046,13 @@ def test_int8_weight_only_quant_subclass_api(self, device, dtype):
10461046
change_linear_weights_to_int8_woqtensors, device, 40, test_dtype=dtype
10471047
)
10481048

1049+
@parameterized.expand(COMMON_DEVICE_DTYPE)
1050+
@torch._inductor.config.patch({"freezing": True})
1051+
def test_int8_weight_only_quant_with_freeze(self, device, dtype):
1052+
self._test_lin_weight_subclass_api_impl(
1053+
change_linear_weights_to_int8_woqtensors, device, 40, test_dtype=dtype
1054+
)
1055+
10491056
@parameterized.expand(COMMON_DEVICE_DTYPE)
10501057
@unittest.skipIf(not TORCH_VERSION_AFTER_2_3, "int4 requires torch nightly.")
10511058
def test_int4_weight_only_quant_subclass_api(self, device, dtype):

0 commit comments

Comments
 (0)