Limit enable_t_mac to take effect on INT_N only.

2024-10-30 16:00:38 +08:00 · 2024-10-30 16:00:38 +08:00 · f84d25dd8f
commit f84d25dd8f
parent 080d2ecc56
1 changed file with 2 additions and 2 deletions
--- a/convert_hf_to_gguf.py
+++ b/convert_hf_to_gguf.py
@@ -1798,8 +1798,8 @@ class BitnetModel(Model):
        ]):
            # transform weight into 1/0/-1 (in fp32)
            data_torch = self.weight_quant(data_torch)
-            if self.enable_t_mac:
+            if self.enable_t_mac and self.ftype == gguf.LlamaFileType.MOSTLY_INT_N:
-                # transform weight into T-MAC I2 format
+                # transform weight into T-MAC INT_N format
                from t_mac.model_utils import preprocess_for_t_mac
                data = LazyTorchTensor.to_eager(data_torch).numpy()
                scale = np.max(np.abs(data))