Fix Qwen2.5-VL 32B model conversion: write n_wa_pattern = 0 when out_hidden_size is 5120

ngxson · ngxson · commit 651752f1ae25 · 2025-04-30T22:04:06.000+02:00
diff --git a/convert_hf_to_gguf.py b/convert_hf_to_gguf.py
@@ -2579,15 +2579,20 @@ def set_gguf_parameters(self):
         elif self.global_config['model_type'] == 'qwen2_5_vl':
             self.gguf_writer.add_vision_projector_type(gguf.VisionProjectorType.QWEN25VL)
             self.gguf_writer.add_vision_use_silu(True)
-            # find n_wa_pattern (window attention pattern)
-            fullatt_block_indexes = hparams.get("fullatt_block_indexes")
-            assert fullatt_block_indexes is not None, "fullatt_block_indexes is required for qwen2_5_vl"
-            n_wa_pattern = fullatt_block_indexes[0] + 1
-            # validate n_wa_pattern
-            for i in range(1, len(fullatt_block_indexes)):
-                if fullatt_block_indexes[i] - fullatt_block_indexes[i - 1] != n_wa_pattern:
-                    raise ValueError(f"Invalid fullatt_block_indexes: {fullatt_block_indexes}")
-            self.gguf_writer.add_vision_n_wa_pattern(n_wa_pattern)
+            out_hidden_size = hparams.get("out_hidden_size")
+            if out_hidden_size == 5120:
+                # 32B model does not have n_wa_pattern, the other models do
+                self.gguf_writer.add_vision_n_wa_pattern(0)
+            else:
+                # find n_wa_pattern (window attention pattern)
+                fullatt_block_indexes = hparams.get("fullatt_block_indexes")
+                assert fullatt_block_indexes is not None, "fullatt_block_indexes is required for qwen2_5_vl"
+                n_wa_pattern = fullatt_block_indexes[0] + 1
+                # validate n_wa_pattern
+                for i in range(1, len(fullatt_block_indexes)):
+                    if fullatt_block_indexes[i] - fullatt_block_indexes[i - 1] != n_wa_pattern:
+                        raise ValueError(f"Invalid fullatt_block_indexes: {fullatt_block_indexes}")
+                self.gguf_writer.add_vision_n_wa_pattern(n_wa_pattern)
         else:
             raise ValueError(f"Unknown QwenVL model type: {self.global_config['model_type']}")
         # default values below are taken from HF tranformers code