From f8ccb577315769d0d0dfe3457d06afc6d471a289 Mon Sep 17 00:00:00 2001
From: Aiden Cline <aidenpcline@gmail.com>
Date: Wed, 10 Jun 2026 16:04:09 -0500
Subject: [PATCH 1/4] [nebius] Audit reasoning controls

---
 providers/nebius/models/MiniMaxAI/MiniMax-M2.5-fast.toml       | 1 +
 providers/nebius/models/MiniMaxAI/MiniMax-M2.5.toml            | 1 +
 providers/nebius/models/NousResearch/Hermes-4-405B.toml        | 3 ++-
 providers/nebius/models/NousResearch/Hermes-4-70B.toml         | 3 ++-
 .../nebius/models/Qwen/Qwen3-235B-A22B-Instruct-2507.toml      | 2 +-
 .../nebius/models/Qwen/Qwen3-235B-A22B-Thinking-2507-fast.toml | 1 +
 .../nebius/models/Qwen/Qwen3-Next-80B-A3B-Thinking-fast.toml   | 1 +
 providers/nebius/models/Qwen/Qwen3-Next-80B-A3B-Thinking.toml  | 3 ++-
 providers/nebius/models/Qwen/Qwen3.5-397B-A17B-fast.toml       | 1 +
 providers/nebius/models/Qwen/Qwen3.5-397B-A17B.toml            | 1 +
 providers/nebius/models/deepseek-ai/DeepSeek-V3.2-fast.toml    | 1 +
 providers/nebius/models/deepseek-ai/DeepSeek-V3.2.toml         | 3 ++-
 providers/nebius/models/deepseek-ai/DeepSeek-V4-Pro.toml       | 1 +
 providers/nebius/models/moonshotai/Kimi-K2.5-fast.toml         | 1 +
 providers/nebius/models/moonshotai/Kimi-K2.5.toml              | 1 +
 providers/nebius/models/nvidia/Nemotron-3-Nano-Omni.toml       | 1 +
 providers/nebius/models/nvidia/nemotron-3-super-120b-a12b.toml | 1 +
 providers/nebius/models/openai/gpt-oss-120b-fast.toml          | 1 +
 providers/nebius/models/openai/gpt-oss-120b.toml               | 3 ++-
 providers/nebius/models/zai-org/GLM-5.toml                     | 1 +
 20 files changed, 25 insertions(+), 6 deletions(-)

diff --git a/providers/nebius/models/MiniMaxAI/MiniMax-M2.5-fast.toml b/providers/nebius/models/MiniMaxAI/MiniMax-M2.5-fast.toml
index 666c5c0fb..7028ba562 100644
--- a/providers/nebius/models/MiniMaxAI/MiniMax-M2.5-fast.toml
+++ b/providers/nebius/models/MiniMaxAI/MiniMax-M2.5-fast.toml
@@ -1,6 +1,7 @@
 name = "MiniMax-M2.5-fast"
 attachment = false
 reasoning = true
+reasoning_options = []
 tool_call = true
 structured_output = true
 temperature = true
diff --git a/providers/nebius/models/MiniMaxAI/MiniMax-M2.5.toml b/providers/nebius/models/MiniMaxAI/MiniMax-M2.5.toml
index fbb57563d..448e398d9 100644
--- a/providers/nebius/models/MiniMaxAI/MiniMax-M2.5.toml
+++ b/providers/nebius/models/MiniMaxAI/MiniMax-M2.5.toml
@@ -1,6 +1,7 @@
 name = "MiniMax-M2.5"
 attachment = false
 reasoning = true
+reasoning_options = []
 tool_call = true
 structured_output = true
 temperature = true
diff --git a/providers/nebius/models/NousResearch/Hermes-4-405B.toml b/providers/nebius/models/NousResearch/Hermes-4-405B.toml
index 728ad3080..61d1275cd 100644
--- a/providers/nebius/models/NousResearch/Hermes-4-405B.toml
+++ b/providers/nebius/models/NousResearch/Hermes-4-405B.toml
@@ -1,6 +1,7 @@
 name = "Hermes-4-405B"
 attachment = false
 reasoning = true
+reasoning_options = []
 tool_call = true
 structured_output = true
 temperature = true
@@ -26,4 +27,4 @@ input = ["text"]
 output = ["text"]
 
 [interleaved]
-field = "reasoning_content"
\ No newline at end of file
+field = "reasoning_content"
diff --git a/providers/nebius/models/NousResearch/Hermes-4-70B.toml b/providers/nebius/models/NousResearch/Hermes-4-70B.toml
index 7080f0827..673a4fdce 100644
--- a/providers/nebius/models/NousResearch/Hermes-4-70B.toml
+++ b/providers/nebius/models/NousResearch/Hermes-4-70B.toml
@@ -1,6 +1,7 @@
 name = "Hermes-4-70B"
 attachment = false
 reasoning = true
+reasoning_options = []
 tool_call = true
 structured_output = true
 temperature = true
@@ -26,4 +27,4 @@ input = ["text"]
 output = ["text"]
 
 [interleaved]
-field = "reasoning_content"
\ No newline at end of file
+field = "reasoning_content"
diff --git a/providers/nebius/models/Qwen/Qwen3-235B-A22B-Instruct-2507.toml b/providers/nebius/models/Qwen/Qwen3-235B-A22B-Instruct-2507.toml
index 5ef8658fc..7ced37cf1 100644
--- a/providers/nebius/models/Qwen/Qwen3-235B-A22B-Instruct-2507.toml
+++ b/providers/nebius/models/Qwen/Qwen3-235B-A22B-Instruct-2507.toml
@@ -3,7 +3,7 @@ family = "qwen"
 release_date = "2025-07-25"
 last_updated = "2025-10-04"
 attachment = false
-reasoning = true
+reasoning = false
 temperature = true
 knowledge = "2025-07"
 tool_call = true
diff --git a/providers/nebius/models/Qwen/Qwen3-235B-A22B-Thinking-2507-fast.toml b/providers/nebius/models/Qwen/Qwen3-235B-A22B-Thinking-2507-fast.toml
index 8ee0db949..f9761fb86 100644
--- a/providers/nebius/models/Qwen/Qwen3-235B-A22B-Thinking-2507-fast.toml
+++ b/providers/nebius/models/Qwen/Qwen3-235B-A22B-Thinking-2507-fast.toml
@@ -1,6 +1,7 @@
 name = "Qwen3-235B-A22B-Thinking-2507-fast"
 attachment = false
 reasoning = true
+reasoning_options = []
 tool_call = true
 structured_output = true
 temperature = true
diff --git a/providers/nebius/models/Qwen/Qwen3-Next-80B-A3B-Thinking-fast.toml b/providers/nebius/models/Qwen/Qwen3-Next-80B-A3B-Thinking-fast.toml
index dc4f905ab..47be141e2 100644
--- a/providers/nebius/models/Qwen/Qwen3-Next-80B-A3B-Thinking-fast.toml
+++ b/providers/nebius/models/Qwen/Qwen3-Next-80B-A3B-Thinking-fast.toml
@@ -1,6 +1,7 @@
 name = "Qwen3-Next-80B-A3B-Thinking-fast"
 attachment = false
 reasoning = true
+reasoning_options = []
 tool_call = true
 structured_output = true
 temperature = true
diff --git a/providers/nebius/models/Qwen/Qwen3-Next-80B-A3B-Thinking.toml b/providers/nebius/models/Qwen/Qwen3-Next-80B-A3B-Thinking.toml
index ca0b79132..926f404df 100644
--- a/providers/nebius/models/Qwen/Qwen3-Next-80B-A3B-Thinking.toml
+++ b/providers/nebius/models/Qwen/Qwen3-Next-80B-A3B-Thinking.toml
@@ -1,6 +1,7 @@
 name = "Qwen3-Next-80B-A3B-Thinking"
 attachment = false
 reasoning = true
+reasoning_options = []
 tool_call = true
 structured_output = true
 temperature = true
@@ -26,4 +27,4 @@ input = ["text"]
 output = ["text"]
 
 [interleaved]
-field = "reasoning_content"
\ No newline at end of file
+field = "reasoning_content"
diff --git a/providers/nebius/models/Qwen/Qwen3.5-397B-A17B-fast.toml b/providers/nebius/models/Qwen/Qwen3.5-397B-A17B-fast.toml
index 9d17f88dd..6f7936044 100644
--- a/providers/nebius/models/Qwen/Qwen3.5-397B-A17B-fast.toml
+++ b/providers/nebius/models/Qwen/Qwen3.5-397B-A17B-fast.toml
@@ -1,6 +1,7 @@
 name = "Qwen3.5-397B-A17B-fast"
 attachment = false
 reasoning = true
+reasoning_options = []
 tool_call = true
 structured_output = true
 temperature = true
diff --git a/providers/nebius/models/Qwen/Qwen3.5-397B-A17B.toml b/providers/nebius/models/Qwen/Qwen3.5-397B-A17B.toml
index f84ebf4d8..233bcfe0b 100644
--- a/providers/nebius/models/Qwen/Qwen3.5-397B-A17B.toml
+++ b/providers/nebius/models/Qwen/Qwen3.5-397B-A17B.toml
@@ -1,6 +1,7 @@
 name = "Qwen3.5-397B-A17B"
 attachment = false
 reasoning = true
+reasoning_options = []
 tool_call = true
 structured_output = true
 temperature = true
diff --git a/providers/nebius/models/deepseek-ai/DeepSeek-V3.2-fast.toml b/providers/nebius/models/deepseek-ai/DeepSeek-V3.2-fast.toml
index 027b3e115..2902306f9 100644
--- a/providers/nebius/models/deepseek-ai/DeepSeek-V3.2-fast.toml
+++ b/providers/nebius/models/deepseek-ai/DeepSeek-V3.2-fast.toml
@@ -1,6 +1,7 @@
 name = "DeepSeek-V3.2-fast"
 attachment = false
 reasoning = true
+reasoning_options = []
 tool_call = true
 structured_output = true
 temperature = true
diff --git a/providers/nebius/models/deepseek-ai/DeepSeek-V3.2.toml b/providers/nebius/models/deepseek-ai/DeepSeek-V3.2.toml
index 147a25262..b34bc3257 100644
--- a/providers/nebius/models/deepseek-ai/DeepSeek-V3.2.toml
+++ b/providers/nebius/models/deepseek-ai/DeepSeek-V3.2.toml
@@ -1,6 +1,7 @@
 name = "DeepSeek-V3.2"
 attachment = false
 reasoning = true
+reasoning_options = []
 tool_call = true
 structured_output = true
 temperature = true
@@ -26,4 +27,4 @@ input = ["text"]
 output = ["text"]
 
 [interleaved]
-field = "reasoning_content"
\ No newline at end of file
+field = "reasoning_content"
diff --git a/providers/nebius/models/deepseek-ai/DeepSeek-V4-Pro.toml b/providers/nebius/models/deepseek-ai/DeepSeek-V4-Pro.toml
index efd2d25ad..20783885e 100644
--- a/providers/nebius/models/deepseek-ai/DeepSeek-V4-Pro.toml
+++ b/providers/nebius/models/deepseek-ai/DeepSeek-V4-Pro.toml
@@ -1,4 +1,5 @@
 base_model = "deepseek/deepseek-v4-pro"
+reasoning_options = []
 
 [interleaved]
 field = "reasoning_content"
diff --git a/providers/nebius/models/moonshotai/Kimi-K2.5-fast.toml b/providers/nebius/models/moonshotai/Kimi-K2.5-fast.toml
index 6ac99aa62..6ec22eb58 100644
--- a/providers/nebius/models/moonshotai/Kimi-K2.5-fast.toml
+++ b/providers/nebius/models/moonshotai/Kimi-K2.5-fast.toml
@@ -4,6 +4,7 @@ release_date = "2025-12-15"
 last_updated = "2026-02-04"
 attachment = true
 reasoning = true
+reasoning_options = []
 tool_call = true
 structured_output = true
 temperature = true
diff --git a/providers/nebius/models/moonshotai/Kimi-K2.5.toml b/providers/nebius/models/moonshotai/Kimi-K2.5.toml
index 2e5e0747b..5d36574c1 100644
--- a/providers/nebius/models/moonshotai/Kimi-K2.5.toml
+++ b/providers/nebius/models/moonshotai/Kimi-K2.5.toml
@@ -4,6 +4,7 @@ release_date = "2025-12-15"
 last_updated = "2026-02-04"
 attachment = true
 reasoning = true
+reasoning_options = []
 tool_call = true
 structured_output = true
 temperature = true
diff --git a/providers/nebius/models/nvidia/Nemotron-3-Nano-Omni.toml b/providers/nebius/models/nvidia/Nemotron-3-Nano-Omni.toml
index 7a8f958d2..114b15c20 100644
--- a/providers/nebius/models/nvidia/Nemotron-3-Nano-Omni.toml
+++ b/providers/nebius/models/nvidia/Nemotron-3-Nano-Omni.toml
@@ -2,6 +2,7 @@ name = "Nemotron-3-Nano-Omni"
 base_model = "nvidia/nemotron-3-nano-omni-30b-a3b-reasoning"
 attachment = false
 reasoning = true
+reasoning_options = []
 tool_call = true
 structured_output = true
 temperature = true
diff --git a/providers/nebius/models/nvidia/nemotron-3-super-120b-a12b.toml b/providers/nebius/models/nvidia/nemotron-3-super-120b-a12b.toml
index 238160399..ae14965ad 100644
--- a/providers/nebius/models/nvidia/nemotron-3-super-120b-a12b.toml
+++ b/providers/nebius/models/nvidia/nemotron-3-super-120b-a12b.toml
@@ -2,6 +2,7 @@ name = "Nemotron-3-Super-120B-A12B"
 base_model = "nvidia/nemotron-3-super-120b-a12b"
 attachment = false
 reasoning = true
+reasoning_options = []
 tool_call = true
 structured_output = true
 temperature = true
diff --git a/providers/nebius/models/openai/gpt-oss-120b-fast.toml b/providers/nebius/models/openai/gpt-oss-120b-fast.toml
index 660a3a101..bb17e7a5e 100644
--- a/providers/nebius/models/openai/gpt-oss-120b-fast.toml
+++ b/providers/nebius/models/openai/gpt-oss-120b-fast.toml
@@ -1,6 +1,7 @@
 name = "gpt-oss-120b-fast"
 attachment = false
 reasoning = true
+reasoning_options = [{ type = "effort", values = ["low", "medium", "high"] }]
 tool_call = true
 structured_output = true
 temperature = true
diff --git a/providers/nebius/models/openai/gpt-oss-120b.toml b/providers/nebius/models/openai/gpt-oss-120b.toml
index 2e61d87f2..c73b1027e 100644
--- a/providers/nebius/models/openai/gpt-oss-120b.toml
+++ b/providers/nebius/models/openai/gpt-oss-120b.toml
@@ -1,6 +1,7 @@
 name = "gpt-oss-120b"
 attachment = false
 reasoning = true
+reasoning_options = [{ type = "effort", values = ["low", "medium", "high"] }]
 tool_call = true
 structured_output = true
 temperature = true
@@ -26,4 +27,4 @@ input = ["text"]
 output = ["text"]
 
 [interleaved]
-field = "reasoning_content"
\ No newline at end of file
+field = "reasoning_content"
diff --git a/providers/nebius/models/zai-org/GLM-5.toml b/providers/nebius/models/zai-org/GLM-5.toml
index c2475bf92..dd1a41fac 100644
--- a/providers/nebius/models/zai-org/GLM-5.toml
+++ b/providers/nebius/models/zai-org/GLM-5.toml
@@ -1,6 +1,7 @@
 name = "GLM-5"
 attachment = false
 reasoning = true
+reasoning_options = []
 tool_call = true
 structured_output = true
 temperature = true

From 38a2f09999e93f2b328554c99ed7f21c65651ae8 Mon Sep 17 00:00:00 2001
From: Aiden Cline <aidenpcline@gmail.com>
Date: Wed, 10 Jun 2026 19:49:42 -0500
Subject: [PATCH 2/4] [nebius] Reconcile model lifecycle evidence

---
 .../models/MiniMaxAI/MiniMax-M2.5-fast.toml   |  2 +-
 .../nebius/models/MiniMaxAI/MiniMax-M2.5.toml |  1 -
 .../models/NousResearch/Hermes-4-405B.toml    |  1 -
 .../models/NousResearch/Hermes-4-70B.toml     |  1 -
 .../models/PrimeIntellect/INTELLECT-3.toml    |  3 ++-
 .../Qwen3-235B-A22B-Thinking-2507-fast.toml   |  1 +
 .../Qwen3-Next-80B-A3B-Thinking-fast.toml     |  2 +-
 .../Qwen/Qwen3-Next-80B-A3B-Thinking.toml     |  1 -
 .../models/Qwen/Qwen3.5-397B-A17B-fast.toml   |  2 +-
 .../nebius/models/Qwen/Qwen3.5-397B-A17B.toml |  1 -
 .../deepseek-ai/DeepSeek-V3.2-fast.toml       |  2 +-
 .../models/deepseek-ai/DeepSeek-V3.2.toml     |  2 +-
 .../models/deepseek-ai/DeepSeek-V4-Pro.toml   |  1 -
 .../nebius/models/google/gemma-2-2b-it.toml   | 25 -------------------
 .../Meta-Llama-3.1-8B-Instruct.toml           | 25 -------------------
 .../models/moonshotai/Kimi-K2.5-fast.toml     |  2 +-
 .../nebius/models/moonshotai/Kimi-K2.5.toml   |  2 +-
 .../models/nvidia/Nemotron-3-Nano-Omni.toml   |  1 -
 .../nvidia/nemotron-3-super-120b-a12b.toml    |  1 -
 .../models/openai/gpt-oss-120b-fast.toml      |  2 +-
 .../nebius/models/openai/gpt-oss-120b.toml    |  1 -
 providers/nebius/models/zai-org/GLM-5.toml    |  2 +-
 22 files changed, 12 insertions(+), 69 deletions(-)
 delete mode 100644 providers/nebius/models/google/gemma-2-2b-it.toml
 delete mode 100644 providers/nebius/models/meta-llama/Meta-Llama-3.1-8B-Instruct.toml

diff --git a/providers/nebius/models/MiniMaxAI/MiniMax-M2.5-fast.toml b/providers/nebius/models/MiniMaxAI/MiniMax-M2.5-fast.toml
index 7028ba562..ecb315de0 100644
--- a/providers/nebius/models/MiniMaxAI/MiniMax-M2.5-fast.toml
+++ b/providers/nebius/models/MiniMaxAI/MiniMax-M2.5-fast.toml
@@ -1,7 +1,7 @@
 name = "MiniMax-M2.5-fast"
 attachment = false
 reasoning = true
-reasoning_options = []
+status = "deprecated"
 tool_call = true
 structured_output = true
 temperature = true
diff --git a/providers/nebius/models/MiniMaxAI/MiniMax-M2.5.toml b/providers/nebius/models/MiniMaxAI/MiniMax-M2.5.toml
index 448e398d9..fbb57563d 100644
--- a/providers/nebius/models/MiniMaxAI/MiniMax-M2.5.toml
+++ b/providers/nebius/models/MiniMaxAI/MiniMax-M2.5.toml
@@ -1,7 +1,6 @@
 name = "MiniMax-M2.5"
 attachment = false
 reasoning = true
-reasoning_options = []
 tool_call = true
 structured_output = true
 temperature = true
diff --git a/providers/nebius/models/NousResearch/Hermes-4-405B.toml b/providers/nebius/models/NousResearch/Hermes-4-405B.toml
index 61d1275cd..a12ab2fbe 100644
--- a/providers/nebius/models/NousResearch/Hermes-4-405B.toml
+++ b/providers/nebius/models/NousResearch/Hermes-4-405B.toml
@@ -1,7 +1,6 @@
 name = "Hermes-4-405B"
 attachment = false
 reasoning = true
-reasoning_options = []
 tool_call = true
 structured_output = true
 temperature = true
diff --git a/providers/nebius/models/NousResearch/Hermes-4-70B.toml b/providers/nebius/models/NousResearch/Hermes-4-70B.toml
index 673a4fdce..309e99d89 100644
--- a/providers/nebius/models/NousResearch/Hermes-4-70B.toml
+++ b/providers/nebius/models/NousResearch/Hermes-4-70B.toml
@@ -1,7 +1,6 @@
 name = "Hermes-4-70B"
 attachment = false
 reasoning = true
-reasoning_options = []
 tool_call = true
 structured_output = true
 temperature = true
diff --git a/providers/nebius/models/PrimeIntellect/INTELLECT-3.toml b/providers/nebius/models/PrimeIntellect/INTELLECT-3.toml
index 743b1edb1..d2de6f510 100644
--- a/providers/nebius/models/PrimeIntellect/INTELLECT-3.toml
+++ b/providers/nebius/models/PrimeIntellect/INTELLECT-3.toml
@@ -1,6 +1,7 @@
 name = "INTELLECT-3"
 attachment = false
 reasoning = false
+status = "deprecated"
 tool_call = true
 structured_output = true
 temperature = true
@@ -22,4 +23,4 @@ output = 8_192
 
 [modalities]
 input = ["text"]
-output = ["text"]
\ No newline at end of file
+output = ["text"]
diff --git a/providers/nebius/models/Qwen/Qwen3-235B-A22B-Thinking-2507-fast.toml b/providers/nebius/models/Qwen/Qwen3-235B-A22B-Thinking-2507-fast.toml
index f9761fb86..68fb846cd 100644
--- a/providers/nebius/models/Qwen/Qwen3-235B-A22B-Thinking-2507-fast.toml
+++ b/providers/nebius/models/Qwen/Qwen3-235B-A22B-Thinking-2507-fast.toml
@@ -2,6 +2,7 @@ name = "Qwen3-235B-A22B-Thinking-2507-fast"
 attachment = false
 reasoning = true
 reasoning_options = []
+status = "deprecated"
 tool_call = true
 structured_output = true
 temperature = true
diff --git a/providers/nebius/models/Qwen/Qwen3-Next-80B-A3B-Thinking-fast.toml b/providers/nebius/models/Qwen/Qwen3-Next-80B-A3B-Thinking-fast.toml
index 47be141e2..30e340dfd 100644
--- a/providers/nebius/models/Qwen/Qwen3-Next-80B-A3B-Thinking-fast.toml
+++ b/providers/nebius/models/Qwen/Qwen3-Next-80B-A3B-Thinking-fast.toml
@@ -1,7 +1,7 @@
 name = "Qwen3-Next-80B-A3B-Thinking-fast"
 attachment = false
 reasoning = true
-reasoning_options = []
+status = "deprecated"
 tool_call = true
 structured_output = true
 temperature = true
diff --git a/providers/nebius/models/Qwen/Qwen3-Next-80B-A3B-Thinking.toml b/providers/nebius/models/Qwen/Qwen3-Next-80B-A3B-Thinking.toml
index 926f404df..9fb4fa80f 100644
--- a/providers/nebius/models/Qwen/Qwen3-Next-80B-A3B-Thinking.toml
+++ b/providers/nebius/models/Qwen/Qwen3-Next-80B-A3B-Thinking.toml
@@ -1,7 +1,6 @@
 name = "Qwen3-Next-80B-A3B-Thinking"
 attachment = false
 reasoning = true
-reasoning_options = []
 tool_call = true
 structured_output = true
 temperature = true
diff --git a/providers/nebius/models/Qwen/Qwen3.5-397B-A17B-fast.toml b/providers/nebius/models/Qwen/Qwen3.5-397B-A17B-fast.toml
index 6f7936044..8e7c18e3f 100644
--- a/providers/nebius/models/Qwen/Qwen3.5-397B-A17B-fast.toml
+++ b/providers/nebius/models/Qwen/Qwen3.5-397B-A17B-fast.toml
@@ -1,7 +1,7 @@
 name = "Qwen3.5-397B-A17B-fast"
 attachment = false
 reasoning = true
-reasoning_options = []
+status = "deprecated"
 tool_call = true
 structured_output = true
 temperature = true
diff --git a/providers/nebius/models/Qwen/Qwen3.5-397B-A17B.toml b/providers/nebius/models/Qwen/Qwen3.5-397B-A17B.toml
index 233bcfe0b..f84ebf4d8 100644
--- a/providers/nebius/models/Qwen/Qwen3.5-397B-A17B.toml
+++ b/providers/nebius/models/Qwen/Qwen3.5-397B-A17B.toml
@@ -1,7 +1,6 @@
 name = "Qwen3.5-397B-A17B"
 attachment = false
 reasoning = true
-reasoning_options = []
 tool_call = true
 structured_output = true
 temperature = true
diff --git a/providers/nebius/models/deepseek-ai/DeepSeek-V3.2-fast.toml b/providers/nebius/models/deepseek-ai/DeepSeek-V3.2-fast.toml
index 2902306f9..9aff42d93 100644
--- a/providers/nebius/models/deepseek-ai/DeepSeek-V3.2-fast.toml
+++ b/providers/nebius/models/deepseek-ai/DeepSeek-V3.2-fast.toml
@@ -1,7 +1,7 @@
 name = "DeepSeek-V3.2-fast"
 attachment = false
 reasoning = true
-reasoning_options = []
+status = "deprecated"
 tool_call = true
 structured_output = true
 temperature = true
diff --git a/providers/nebius/models/deepseek-ai/DeepSeek-V3.2.toml b/providers/nebius/models/deepseek-ai/DeepSeek-V3.2.toml
index b34bc3257..acda35bee 100644
--- a/providers/nebius/models/deepseek-ai/DeepSeek-V3.2.toml
+++ b/providers/nebius/models/deepseek-ai/DeepSeek-V3.2.toml
@@ -1,7 +1,7 @@
 name = "DeepSeek-V3.2"
 attachment = false
 reasoning = true
-reasoning_options = []
+status = "deprecated"
 tool_call = true
 structured_output = true
 temperature = true
diff --git a/providers/nebius/models/deepseek-ai/DeepSeek-V4-Pro.toml b/providers/nebius/models/deepseek-ai/DeepSeek-V4-Pro.toml
index 20783885e..efd2d25ad 100644
--- a/providers/nebius/models/deepseek-ai/DeepSeek-V4-Pro.toml
+++ b/providers/nebius/models/deepseek-ai/DeepSeek-V4-Pro.toml
@@ -1,5 +1,4 @@
 base_model = "deepseek/deepseek-v4-pro"
-reasoning_options = []
 
 [interleaved]
 field = "reasoning_content"
diff --git a/providers/nebius/models/google/gemma-2-2b-it.toml b/providers/nebius/models/google/gemma-2-2b-it.toml
deleted file mode 100644
index f5e60c4ed..000000000
--- a/providers/nebius/models/google/gemma-2-2b-it.toml
+++ /dev/null
@@ -1,25 +0,0 @@
-name = "Gemma-2-2b-it"
-attachment = false
-reasoning = false
-tool_call = false
-structured_output = false
-temperature = true
-knowledge = "2024-06"
-release_date = "2024-07-31"
-last_updated = "2026-02-04"
-open_weights = true
-
-[cost]
-input = 0.02
-output = 0.06
-cache_read = 0.002
-cache_write = 0.025
-
-[limit]
-context = 8_192
-input = 8_000
-output = 4_096
-
-[modalities]
-input = ["text"]
-output = ["text"]
\ No newline at end of file
diff --git a/providers/nebius/models/meta-llama/Meta-Llama-3.1-8B-Instruct.toml b/providers/nebius/models/meta-llama/Meta-Llama-3.1-8B-Instruct.toml
deleted file mode 100644
index ddb722a68..000000000
--- a/providers/nebius/models/meta-llama/Meta-Llama-3.1-8B-Instruct.toml
+++ /dev/null
@@ -1,25 +0,0 @@
-name = "Meta-Llama-3.1-8B-Instruct"
-attachment = false
-reasoning = false
-tool_call = true
-structured_output = true
-temperature = true
-knowledge = "2024-12"
-release_date = "2024-07-23"
-last_updated = "2026-02-04"
-open_weights = true
-
-[cost]
-input = 0.02
-output = 0.06
-cache_read = 0.002
-cache_write = 0.025
-
-[limit]
-context = 128_000
-input = 120_000
-output = 4_096
-
-[modalities]
-input = ["text"]
-output = ["text"]
\ No newline at end of file
diff --git a/providers/nebius/models/moonshotai/Kimi-K2.5-fast.toml b/providers/nebius/models/moonshotai/Kimi-K2.5-fast.toml
index 6ec22eb58..6f8a01495 100644
--- a/providers/nebius/models/moonshotai/Kimi-K2.5-fast.toml
+++ b/providers/nebius/models/moonshotai/Kimi-K2.5-fast.toml
@@ -4,7 +4,7 @@ release_date = "2025-12-15"
 last_updated = "2026-02-04"
 attachment = true
 reasoning = true
-reasoning_options = []
+status = "deprecated"
 tool_call = true
 structured_output = true
 temperature = true
diff --git a/providers/nebius/models/moonshotai/Kimi-K2.5.toml b/providers/nebius/models/moonshotai/Kimi-K2.5.toml
index 5d36574c1..d60bf396e 100644
--- a/providers/nebius/models/moonshotai/Kimi-K2.5.toml
+++ b/providers/nebius/models/moonshotai/Kimi-K2.5.toml
@@ -4,7 +4,7 @@ release_date = "2025-12-15"
 last_updated = "2026-02-04"
 attachment = true
 reasoning = true
-reasoning_options = []
+status = "deprecated"
 tool_call = true
 structured_output = true
 temperature = true
diff --git a/providers/nebius/models/nvidia/Nemotron-3-Nano-Omni.toml b/providers/nebius/models/nvidia/Nemotron-3-Nano-Omni.toml
index 114b15c20..7a8f958d2 100644
--- a/providers/nebius/models/nvidia/Nemotron-3-Nano-Omni.toml
+++ b/providers/nebius/models/nvidia/Nemotron-3-Nano-Omni.toml
@@ -2,7 +2,6 @@ name = "Nemotron-3-Nano-Omni"
 base_model = "nvidia/nemotron-3-nano-omni-30b-a3b-reasoning"
 attachment = false
 reasoning = true
-reasoning_options = []
 tool_call = true
 structured_output = true
 temperature = true
diff --git a/providers/nebius/models/nvidia/nemotron-3-super-120b-a12b.toml b/providers/nebius/models/nvidia/nemotron-3-super-120b-a12b.toml
index ae14965ad..238160399 100644
--- a/providers/nebius/models/nvidia/nemotron-3-super-120b-a12b.toml
+++ b/providers/nebius/models/nvidia/nemotron-3-super-120b-a12b.toml
@@ -2,7 +2,6 @@ name = "Nemotron-3-Super-120B-A12B"
 base_model = "nvidia/nemotron-3-super-120b-a12b"
 attachment = false
 reasoning = true
-reasoning_options = []
 tool_call = true
 structured_output = true
 temperature = true
diff --git a/providers/nebius/models/openai/gpt-oss-120b-fast.toml b/providers/nebius/models/openai/gpt-oss-120b-fast.toml
index bb17e7a5e..07269642f 100644
--- a/providers/nebius/models/openai/gpt-oss-120b-fast.toml
+++ b/providers/nebius/models/openai/gpt-oss-120b-fast.toml
@@ -1,7 +1,7 @@
 name = "gpt-oss-120b-fast"
 attachment = false
 reasoning = true
-reasoning_options = [{ type = "effort", values = ["low", "medium", "high"] }]
+status = "deprecated"
 tool_call = true
 structured_output = true
 temperature = true
diff --git a/providers/nebius/models/openai/gpt-oss-120b.toml b/providers/nebius/models/openai/gpt-oss-120b.toml
index c73b1027e..a84ce3226 100644
--- a/providers/nebius/models/openai/gpt-oss-120b.toml
+++ b/providers/nebius/models/openai/gpt-oss-120b.toml
@@ -1,7 +1,6 @@
 name = "gpt-oss-120b"
 attachment = false
 reasoning = true
-reasoning_options = [{ type = "effort", values = ["low", "medium", "high"] }]
 tool_call = true
 structured_output = true
 temperature = true
diff --git a/providers/nebius/models/zai-org/GLM-5.toml b/providers/nebius/models/zai-org/GLM-5.toml
index dd1a41fac..6052648f6 100644
--- a/providers/nebius/models/zai-org/GLM-5.toml
+++ b/providers/nebius/models/zai-org/GLM-5.toml
@@ -1,7 +1,7 @@
 name = "GLM-5"
 attachment = false
 reasoning = true
-reasoning_options = []
+status = "deprecated"
 tool_call = true
 structured_output = true
 temperature = true

From 6799ff1078ece343fe2c50c7877c917c6ac9972a Mon Sep 17 00:00:00 2001
From: Aiden Cline <aidenpcline@gmail.com>
Date: Wed, 10 Jun 2026 20:02:58 -0500
Subject: [PATCH 3/4] [nebius] Correct verified reasoning controls

---
 .../nebius/models/Qwen/Qwen3-235B-A22B-Thinking-2507-fast.toml   | 1 -
 providers/nebius/models/Qwen/Qwen3.5-397B-A17B-fast.toml         | 1 +
 providers/nebius/models/Qwen/Qwen3.5-397B-A17B.toml              | 1 +
 providers/nebius/models/openai/gpt-oss-120b-fast.toml            | 1 +
 providers/nebius/models/openai/gpt-oss-120b.toml                 | 1 +
 providers/nebius/models/zai-org/GLM-5.toml                       | 1 +
 6 files changed, 5 insertions(+), 1 deletion(-)

diff --git a/providers/nebius/models/Qwen/Qwen3-235B-A22B-Thinking-2507-fast.toml b/providers/nebius/models/Qwen/Qwen3-235B-A22B-Thinking-2507-fast.toml
index 68fb846cd..cb2cfd9fd 100644
--- a/providers/nebius/models/Qwen/Qwen3-235B-A22B-Thinking-2507-fast.toml
+++ b/providers/nebius/models/Qwen/Qwen3-235B-A22B-Thinking-2507-fast.toml
@@ -1,7 +1,6 @@
 name = "Qwen3-235B-A22B-Thinking-2507-fast"
 attachment = false
 reasoning = true
-reasoning_options = []
 status = "deprecated"
 tool_call = true
 structured_output = true
diff --git a/providers/nebius/models/Qwen/Qwen3.5-397B-A17B-fast.toml b/providers/nebius/models/Qwen/Qwen3.5-397B-A17B-fast.toml
index 8e7c18e3f..0bb3885a9 100644
--- a/providers/nebius/models/Qwen/Qwen3.5-397B-A17B-fast.toml
+++ b/providers/nebius/models/Qwen/Qwen3.5-397B-A17B-fast.toml
@@ -1,6 +1,7 @@
 name = "Qwen3.5-397B-A17B-fast"
 attachment = false
 reasoning = true
+reasoning_options = [{ type = "toggle" }]
 status = "deprecated"
 tool_call = true
 structured_output = true
diff --git a/providers/nebius/models/Qwen/Qwen3.5-397B-A17B.toml b/providers/nebius/models/Qwen/Qwen3.5-397B-A17B.toml
index f84ebf4d8..d007e174e 100644
--- a/providers/nebius/models/Qwen/Qwen3.5-397B-A17B.toml
+++ b/providers/nebius/models/Qwen/Qwen3.5-397B-A17B.toml
@@ -1,6 +1,7 @@
 name = "Qwen3.5-397B-A17B"
 attachment = false
 reasoning = true
+reasoning_options = [{ type = "toggle" }]
 tool_call = true
 structured_output = true
 temperature = true
diff --git a/providers/nebius/models/openai/gpt-oss-120b-fast.toml b/providers/nebius/models/openai/gpt-oss-120b-fast.toml
index 07269642f..5cebac08c 100644
--- a/providers/nebius/models/openai/gpt-oss-120b-fast.toml
+++ b/providers/nebius/models/openai/gpt-oss-120b-fast.toml
@@ -1,6 +1,7 @@
 name = "gpt-oss-120b-fast"
 attachment = false
 reasoning = true
+reasoning_options = [{ type = "effort", values = ["low", "medium", "high"] }]
 status = "deprecated"
 tool_call = true
 structured_output = true
diff --git a/providers/nebius/models/openai/gpt-oss-120b.toml b/providers/nebius/models/openai/gpt-oss-120b.toml
index a84ce3226..c73b1027e 100644
--- a/providers/nebius/models/openai/gpt-oss-120b.toml
+++ b/providers/nebius/models/openai/gpt-oss-120b.toml
@@ -1,6 +1,7 @@
 name = "gpt-oss-120b"
 attachment = false
 reasoning = true
+reasoning_options = [{ type = "effort", values = ["low", "medium", "high"] }]
 tool_call = true
 structured_output = true
 temperature = true
diff --git a/providers/nebius/models/zai-org/GLM-5.toml b/providers/nebius/models/zai-org/GLM-5.toml
index 6052648f6..099a4056c 100644
--- a/providers/nebius/models/zai-org/GLM-5.toml
+++ b/providers/nebius/models/zai-org/GLM-5.toml
@@ -1,6 +1,7 @@
 name = "GLM-5"
 attachment = false
 reasoning = true
+reasoning_options = [{ type = "toggle" }]
 status = "deprecated"
 tool_call = true
 structured_output = true

From 4c5b17b1db601ab11991b576ec54b0add181e838 Mon Sep 17 00:00:00 2001
From: Aiden Cline <aidenpcline@gmail.com>
Date: Wed, 10 Jun 2026 23:13:35 -0500
Subject: [PATCH 4/4] [nebius] Test generated provider matrix

---
 packages/core/test/nebius.test.ts | 133 ++++++++++++++++++++++++++++++
 1 file changed, 133 insertions(+)
 create mode 100644 packages/core/test/nebius.test.ts

diff --git a/packages/core/test/nebius.test.ts b/packages/core/test/nebius.test.ts
new file mode 100644
index 000000000..169c1bb46
--- /dev/null
+++ b/packages/core/test/nebius.test.ts
@@ -0,0 +1,133 @@
+import { expect, test } from "bun:test";
+import path from "node:path";
+
+import { generate } from "../src/index.js";
+// Expected key set of the generated Nebius models; sorted to match the sorted keys.
+const modelIDs = [
+  "MiniMaxAI/MiniMax-M2.5",
+  "MiniMaxAI/MiniMax-M2.5-fast",
+  "NousResearch/Hermes-4-405B",
+  "NousResearch/Hermes-4-70B",
+  "PrimeIntellect/INTELLECT-3",
+  "Qwen/Qwen2.5-VL-72B-Instruct",
+  "Qwen/Qwen3-235B-A22B-Instruct-2507",
+  "Qwen/Qwen3-235B-A22B-Thinking-2507-fast",
+  "Qwen/Qwen3-30B-A3B-Instruct-2507",
+  "Qwen/Qwen3-32B",
+  "Qwen/Qwen3-Embedding-8B",
+  "Qwen/Qwen3-Next-80B-A3B-Thinking",
+  "Qwen/Qwen3-Next-80B-A3B-Thinking-fast",
+  "Qwen/Qwen3.5-397B-A17B",
+  "Qwen/Qwen3.5-397B-A17B-fast",
+  "deepseek-ai/DeepSeek-V3.2",
+  "deepseek-ai/DeepSeek-V3.2-fast",
+  "deepseek-ai/DeepSeek-V4-Pro",
+  "google/gemma-3-27b-it",
+  "meta-llama/Llama-3.3-70B-Instruct",
+  "moonshotai/Kimi-K2.5",
+  "moonshotai/Kimi-K2.5-fast",
+  "nvidia/Llama-3_1-Nemotron-Ultra-253B-v1",
+  "nvidia/NVIDIA-Nemotron-3-Nano-30B-A3B",
+  "nvidia/Nemotron-3-Nano-Omni",
+  "nvidia/nemotron-3-super-120b-a12b",
+  "openai/gpt-oss-120b",
+  "openai/gpt-oss-120b-fast",
+  "zai-org/GLM-5",
+].sort();
+// Expected IDs of models with reasoning enabled but no reasoning_options declared.
+const unresolvedReasoning = [
+  "MiniMaxAI/MiniMax-M2.5",
+  "MiniMaxAI/MiniMax-M2.5-fast",
+  "NousResearch/Hermes-4-405B",
+  "NousResearch/Hermes-4-70B",
+  "Qwen/Qwen3-235B-A22B-Thinking-2507-fast",
+  "Qwen/Qwen3-Next-80B-A3B-Thinking",
+  "Qwen/Qwen3-Next-80B-A3B-Thinking-fast",
+  "deepseek-ai/DeepSeek-V3.2",
+  "deepseek-ai/DeepSeek-V3.2-fast",
+  "deepseek-ai/DeepSeek-V4-Pro",
+  "moonshotai/Kimi-K2.5",
+  "moonshotai/Kimi-K2.5-fast",
+  "nvidia/Nemotron-3-Nano-Omni",
+  "nvidia/nemotron-3-super-120b-a12b",
+].sort();
+// Expected IDs of models whose generated status is "deprecated".
+const deprecated = [
+  "MiniMaxAI/MiniMax-M2.5-fast",
+  "PrimeIntellect/INTELLECT-3",
+  "Qwen/Qwen3-235B-A22B-Thinking-2507-fast",
+  "Qwen/Qwen3-Next-80B-A3B-Thinking-fast",
+  "Qwen/Qwen3.5-397B-A17B-fast",
+  "deepseek-ai/DeepSeek-V3.2",
+  "deepseek-ai/DeepSeek-V3.2-fast",
+  "moonshotai/Kimi-K2.5",
+  "moonshotai/Kimi-K2.5-fast",
+  "openai/gpt-oss-120b-fast",
+  "zai-org/GLM-5",
+].sort();
+// Runs generate() on the providers/ directory three levels above this test file.
+test("generated Nebius provider matches the reviewed model matrix", async () => {
+  const root = path.join(import.meta.dirname, "..", "..", "..");
+  const providers = await generate(path.join(root, "providers"));
+  const models = providers.nebius?.models;
+  expect(models).toBeDefined();
+  if (models === undefined) throw new Error("Nebius provider was not generated");
+  expect(Object.keys(models).sort()).toEqual(modelIDs);
+  // Array key paths: a string path would be split at the "." in "3.1" and never match.
+  expect(models).not.toHaveProperty(["meta-llama/Meta-Llama-3.1-8B-Instruct"]);
+  expect(models).not.toHaveProperty(["google/gemma-2-2b-it"]);
+  // Collect reasoning_options, keyed by model ID, for every model that defines them.
+  const verifiedControls = Object.fromEntries(
+    Object.entries(models)
+      .filter(([, model]) => model.reasoning_options !== undefined)
+      .map(([id, model]) => [id, model.reasoning_options]),
+  );
+  expect(verifiedControls).toEqual({
+    "Qwen/Qwen3.5-397B-A17B": [{ type: "toggle" }],
+    "Qwen/Qwen3.5-397B-A17B-fast": [{ type: "toggle" }],
+    "openai/gpt-oss-120b": [
+      { type: "effort", values: ["low", "medium", "high"] },
+    ],
+    "openai/gpt-oss-120b-fast": [
+      { type: "effort", values: ["low", "medium", "high"] },
+    ],
+    "zai-org/GLM-5": [{ type: "toggle" }],
+  });
+  // Consistency: no empty option lists, no options without reasoning, known statuses.
+  expect(
+    Object.entries(models)
+      .filter(([, model]) => model.reasoning && model.reasoning_options === undefined)
+      .map(([id]) => id)
+      .sort(),
+  ).toEqual(unresolvedReasoning);
+  expect(
+    Object.entries(models)
+      .filter(([, model]) => model.reasoning_options?.length === 0)
+      .map(([id]) => id),
+  ).toEqual([]);
+  expect(
+    Object.entries(models)
+      .filter(([, model]) => !model.reasoning && model.reasoning_options !== undefined)
+      .map(([id]) => id),
+  ).toEqual([]);
+  expect(
+    Object.entries(models)
+      .filter(([, model]) => model.status === "deprecated")
+      .map(([id]) => id)
+      .sort(),
+  ).toEqual(deprecated);
+  // Spot checks: -fast variants mirror their base entry; V4-Pro exposes no base_model.
+  expect(models["openai/gpt-oss-120b-fast"]?.reasoning_options).toEqual(
+    models["openai/gpt-oss-120b"]?.reasoning_options,
+  );
+  expect(models["Qwen/Qwen3.5-397B-A17B-fast"]?.reasoning_options).toEqual(
+    models["Qwen/Qwen3.5-397B-A17B"]?.reasoning_options,
+  );
+  expect(models["deepseek-ai/DeepSeek-V4-Pro"]).toMatchObject({
+    id: "deepseek-ai/DeepSeek-V4-Pro",
+    name: "DeepSeek V4 Pro",
+    reasoning: true,
+  });
+  expect(models["deepseek-ai/DeepSeek-V4-Pro"]).not.toHaveProperty("base_model");
+  expect(models["deepseek-ai/DeepSeek-V4-Pro"]?.reasoning_options).toBeUndefined();
+});