Skip to content

Commit a349409

Browse files
committed
Revert "Add quant+sparse subclasses to torchao"
This reverts commit ada04bf.
1 parent ada04bf commit a349409

File tree

7 files changed

+0
-406
lines changed

7 files changed

+0
-406
lines changed

benchmark_sam.py

Lines changed: 0 additions & 95 deletions
This file was deleted.

torchao/quantization/__init__.py

Lines changed: 0 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -16,7 +16,6 @@
1616
"apply_weight_only_int8_quant",
1717
"apply_dynamic_quant",
1818
"change_linear_weights_to_int8_dqtensors",
19-
"change_linear_weights_to_int8_dq_semi_structured_sparsetensors",
2019
"change_linear_weights_to_int8_woqtensors",
2120
"change_linear_weights_to_int4_woqtensors",
2221
"swap_conv2d_1x1_to_linear"

torchao/quantization/dynamic_quant_sparse.py

Lines changed: 0 additions & 166 deletions
This file was deleted.

torchao/quantization/quant_api.py

Lines changed: 0 additions & 13 deletions
Original file line number | Diff line number | Diff line change
@@ -22,7 +22,6 @@
2222
from .subclass import (
2323
QuantizedLinearWeightBase,
2424
Int8DynamicallyQuantizedLinearWeight,
25-
Int8DynamicallyQuantizedSemiStructuredSparseLinearWeight,
2625
Int8WeightOnlyQuantizedLinearWeight,
2726
Int4WeightOnlyQuantizedLinearWeight,
2827
)
@@ -34,7 +33,6 @@
3433
"apply_weight_only_int8_quant",
3534
"apply_dynamic_quant",
3635
"change_linear_weights_to_int8_dqtensors",
37-
"change_linear_weights_to_int8_dq_semi_structured_sparsetensors",
3836
"change_linear_weights_to_int8_woqtensors",
3937
"change_linear_weights_to_int4_woqtensors",
4038
"swap_conv2d_1x1_to_linear"
@@ -155,17 +153,6 @@ def change_linear_weights_to_int4_woqtensors(model, **kwargs):
155153
filter_fn,
156154
)
157155

158-
159-
def change_linear_weights_to_int8_dq_semi_structured_sparsetensors(model, **kwargs):
160-
filter_fn = kwargs.pop("filter_fn", _is_linear)
161-
162-
_replace_with_custom_fn_if_matches_filter(
163-
model,
164-
_get_subclass_inserter(Int8DynamicallyQuantizedSemiStructuredSparseLinearWeight, **kwargs),
165-
filter_fn,
166-
)
167-
168-
169156
def swap_conv2d_1x1_to_linear(model, filter_fn=None):
170157
"""
171158
Changes all conv2d 1x1 modules to equivalent linear modules so that they can then be quantized.

0 commit comments

Comments (0)