We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent e919558, commit 09b8b3c (Copy full SHA for 09b8b3c)
torchao/quantization/__init__.py
@@ -46,11 +46,11 @@
46
"int4_weight_only",
47
"int8_weight_only",
48
"uintx_weight_only",
49
- "float8_weight_only",
50
"fpx_weight_only",
51
"LinearActivationQuantizedTensor",
52
"to_linear_activation_quantized",
53
"to_weight_tensor_with_linear_activation_scale_metadata",
54
"float8_weight_only",
55
- "float8_dynamic_activation_float8_weight"
+ "float8_dynamic_activation_float8_weight",
+ "float8_static_activation_float8_weight"
56
]
torchao/quantization/quant_api.py
@@ -93,6 +93,7 @@
93
94
95
"float8_dynamic_activation_float8_weight",
96
+ "float8_static_activation_float8_weight",
97
98
99
from .GPTQ import (
0 commit comments