Commit c4ef9a8

fix rtn bug (#966)
1 parent 5e33cbc commit c4ef9a8

File tree

1 file changed: 5 additions, 4 deletions

auto_round/compressors/base.py

Lines changed: 5 additions & 4 deletions
@@ -1312,10 +1312,11 @@ def _quantize_rtn(self) -> tuple[torch.nn.Module, dict[str, Any]]:
         self.model.to("cpu")

         enable_imatrix = False
-        if has_gguf_k and not self.disable_opt_rtn:
-            enable_imatrix = True
-        if self.data_type == "int" and self.sym:
-            enable_imatrix = True
+        if not self.disable_opt_rtn:
+            if has_gguf_k:
+                enable_imatrix = True
+            elif self.data_type == "int" and self.sym:
+                enable_imatrix = True

         if enable_imatrix:
             self._quant_rtn_with_imatrix(all_to_quantized_module_names)
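The bug: in the old logic, the second if set enable_imatrix for symmetric int quantization even when disable_opt_rtn was True, so the flag did not actually disable the optimized RTN path. A minimal before/after sketch of the decision logic (standalone functions with hypothetical names, not part of the repository) shows the case this commit fixes:

# Minimal sketch of the decision logic before and after this commit.
# The flag names mirror those used in _quantize_rtn; everything else is illustrative.

def enable_imatrix_old(has_gguf_k, disable_opt_rtn, data_type, sym):
    enable_imatrix = False
    if has_gguf_k and not disable_opt_rtn:
        enable_imatrix = True
    if data_type == "int" and sym:  # bug: this branch ignores disable_opt_rtn
        enable_imatrix = True
    return enable_imatrix

def enable_imatrix_new(has_gguf_k, disable_opt_rtn, data_type, sym):
    enable_imatrix = False
    if not disable_opt_rtn:  # fix: both branches now respect the flag
        if has_gguf_k:
            enable_imatrix = True
        elif data_type == "int" and sym:
            enable_imatrix = True
    return enable_imatrix

# The case the commit fixes: opt-RTN explicitly disabled, symmetric int quantization.
assert enable_imatrix_old(False, True, "int", True) is True   # imatrix wrongly enabled
assert enable_imatrix_new(False, True, "int", True) is False  # flag now respected

The nested if/elif also means the GGUF-k check is evaluated first, but when the flag allows optimization both branches still lead to the same imatrix path.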
