Skip to content

Commit ba4c406

Browse files
committed
Fix type errors: add type ignores for unsloth runtime function signatures
1 parent 7871978 commit ba4c406

3 files changed

Lines changed: 13 additions & 8 deletions

File tree

pyproject.toml

Lines changed: 1 addition & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -198,6 +198,7 @@ allowed-unresolved-imports = [
198198
"nbclient.**",
199199
"nbmake.**",
200200
"peft.**",
201+
"safetensors.**",
201202
"pyarrow.**",
202203
"torch.**",
203204
"torchao.**",

src/art/unsloth/dtype_patch.py

Lines changed: 10 additions & 6 deletions
Original file line number | Diff line number | Diff line change
@@ -86,14 +86,14 @@ def patched_matmul_lora(
8686
W_full = W.dequantize()
8787
else:
8888
W_full = W.contiguous()
89-
out = torch_matmul(X, W_full.t(), out=out)
89+
out = torch_matmul(X, W_full.t(), out=out) # type: ignore[call-arg]
9090
elif getattr(W, "dtype", None) == getattr(torch, "float8_e4m3fn", None):
9191
if fp8_linear is None:
9292
raise RuntimeError("FP8 weights detected but fp8_linear unavailable.")
9393
out = fp8_linear(X, W, W_quant)
9494
else:
95-
W_full = fast_dequantize(W, W_quant, use_global_buffer=True)
96-
out = torch_matmul(X, W_full.t(), out=out)
95+
W_full = fast_dequantize(W, W_quant, use_global_buffer=True) # type: ignore[call-arg]
96+
out = torch_matmul(X, W_full.t(), out=out) # type: ignore[call-arg]
9797

9898
if A is not None:
9999
td = _target_dtype(out, dtype)
@@ -113,16 +113,16 @@ def patched_fast_linear_forward(
113113
return patched_matmul_lora(X, W, W_quant, lora_A, lora_B, lora_S)
114114

115115
if W_quant is None:
116-
out = torch_matmul(X, W.t(), out=out)
116+
out = torch_matmul(X, W.t(), out=out) # type: ignore[call-arg]
117117
elif getattr(W, "dtype", None) == getattr(torch, "float8_e4m3fn", None):
118118
if fp8_linear is None:
119119
raise RuntimeError("FP8 weights detected but fp8_linear unavailable.")
120120
out = fp8_linear(X, W, W_quant, bias)
121121
elif fast_gemv is not None and bsz == 1 and q_len == 1:
122122
out = fast_gemv(X, W, W_quant, out=out)
123123
else:
124-
W_full = fast_dequantize(W.t(), W_quant, use_global_buffer=True)
125-
out = torch_matmul(X, W_full, out=out)
124+
W_full = fast_dequantize(W.t(), W_quant, use_global_buffer=True) # type: ignore[call-arg]
125+
out = torch_matmul(X, W_full, out=out) # type: ignore[call-arg]
126126

127127
if lora_A is not None:
128128
td = _target_dtype(out, X.dtype)
@@ -166,3 +166,7 @@ def patched_fast_linear_forward(
166166
if log:
167167
log.debug("Applied Unsloth LoRA dtype harmonisation patch.")
168168
return True
169+
170+
171+
# Apply eagerly so import side-effects protect downstream callers.
172+
ensure_dtype_patch(logging.getLogger(__name__))

src/art/unsloth/service.py

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -592,7 +592,7 @@ async def _train_dedicated(
592592
# Load forked adapter weights on first training call if needed.
593593
forked_dir = getattr(self, "_forked_checkpoint_dir", None)
594594
if forked_dir is not None:
595-
del self._forked_checkpoint_dir
595+
self._forked_checkpoint_dir = None
596596
await self._state.load_lora_adapter(forked_dir)
597597
async for result in run_unsloth_rl_training(
598598
self._state,
@@ -638,7 +638,7 @@ async def _train_shared(
638638
# Load forked adapter weights on first training call if needed.
639639
forked_dir = getattr(self, "_forked_checkpoint_dir", None)
640640
if forked_dir is not None:
641-
del self._forked_checkpoint_dir
641+
self._forked_checkpoint_dir = None
642642
await self._state.load_lora_adapter(forked_dir)
643643
llm = await self.llm
644644

0 commit comments

Comments (0)