@@ -49,9 +49,9 @@ def setUpClass(self):
4949
5050 @parameterized .expand (
5151 [
52- # (QUANT_METHOD.GPTQ, BACKEND.AUTO, False, FORMAT.GPTQ, 8),
52+ (QUANT_METHOD .GPTQ , BACKEND .AUTO , False , FORMAT .GPTQ , 8 ),
5353 (QUANT_METHOD .GPTQ , BACKEND .EXLLAMA_V2 , True , FORMAT .GPTQ_V2 , 4 ),
54- # (QUANT_METHOD.GPTQ, BACKEND.EXLLAMA_V2, False, FORMAT.GPTQ, 4),
54+ (QUANT_METHOD .GPTQ , BACKEND .EXLLAMA_V2 , False , FORMAT .GPTQ , 4 ),
5555 ]
5656 )
5757 def test_quantize (self , method : QUANT_METHOD , backend : BACKEND , sym : bool , format : FORMAT , bits : int ):
@@ -115,12 +115,13 @@ def test_quantize(self, method: QUANT_METHOD, backend: BACKEND, sym: bool, forma
115115 if not sym and format == FORMAT .GPTQ or format == FORMAT .IPEX :
116116 return
117117
118- # test compat: 1) with simple dict type
118+ # test compat: 1) with simple dict type 2) is_marlin_format
119119 compat_quantize_config = {
120120 "bits" : bits ,
121121 "group_size" : 128 ,
122122 "sym" : sym ,
123123 "desc_act" : False if format == FORMAT .MARLIN else True ,
124+ "is_marlin_format" : backend == BACKEND .MARLIN ,
124125 }
125126
126127 model = GPTQModel .load (
0 commit comments