Fix type errors: add type ignores for unsloth runtime function signatures and allow unresolved safetensors imports

arcticfly · arcticfly · commit 934689462c99 · 2026-04-14T15:38:44.000-07:00
diff --git a/pyproject.toml b/pyproject.toml
@@ -198,6 +198,7 @@ allowed-unresolved-imports = [
     "nbclient.**",
     "nbmake.**",
     "peft.**",
+    "safetensors.**",
     "pyarrow.**",
     "torch.**",
     "torchao.**",
diff --git a/src/art/unsloth/dtype_patch.py b/src/art/unsloth/dtype_patch.py
@@ -86,14 +86,14 @@ def patched_matmul_lora(
                 W_full = W.dequantize()
             else:
                 W_full = W.contiguous()
-            out = torch_matmul(X, W_full.t(), out=out)
+            out = torch_matmul(X, W_full.t(), out=out)  # type: ignore[call-arg]
         elif getattr(W, "dtype", None) == getattr(torch, "float8_e4m3fn", None):
             if fp8_linear is None:
                 raise RuntimeError("FP8 weights detected but fp8_linear unavailable.")
             out = fp8_linear(X, W, W_quant)
         else:
-            W_full = fast_dequantize(W, W_quant, use_global_buffer=True)
-            out = torch_matmul(X, W_full.t(), out=out)
+            W_full = fast_dequantize(W, W_quant, use_global_buffer=True)  # type: ignore[call-arg]
+            out = torch_matmul(X, W_full.t(), out=out)  # type: ignore[call-arg]
 
         if A is not None:
             td = _target_dtype(out, dtype)
@@ -113,16 +113,16 @@ def patched_fast_linear_forward(
             return patched_matmul_lora(X, W, W_quant, lora_A, lora_B, lora_S)
 
         if W_quant is None:
-            out = torch_matmul(X, W.t(), out=out)
+            out = torch_matmul(X, W.t(), out=out)  # type: ignore[call-arg]
         elif getattr(W, "dtype", None) == getattr(torch, "float8_e4m3fn", None):
             if fp8_linear is None:
                 raise RuntimeError("FP8 weights detected but fp8_linear unavailable.")
             out = fp8_linear(X, W, W_quant, bias)
         elif fast_gemv is not None and bsz == 1 and q_len == 1:
             out = fast_gemv(X, W, W_quant, out=out)
         else:
-            W_full = fast_dequantize(W.t(), W_quant, use_global_buffer=True)
-            out = torch_matmul(X, W_full, out=out)
+            W_full = fast_dequantize(W.t(), W_quant, use_global_buffer=True)  # type: ignore[call-arg]
+            out = torch_matmul(X, W_full, out=out)  # type: ignore[call-arg]
 
         if lora_A is not None:
             td = _target_dtype(out, X.dtype)