diff options
| author | Paul Buetow <paul@buetow.org> | 2026-05-24 14:02:34 +0300 |
|---|---|---|
| committer | Paul Buetow <paul@buetow.org> | 2026-05-24 14:02:34 +0300 |
| commit | c8bd4d1e7a34ebf452d3d6c843d5cef785abe608 (patch) | |
| tree | ec1e6c19379c3ba86f6d80d90286eceae393b983 /pi | |
| parent | f16f4b753b3bf317e6da79f479ff5f506ed34b47 (diff) | |
replace qwen3-coder-next with qwen3.6-27b across configs, docs, and tooling
Diffstat (limited to 'pi')
| -rw-r--r-- | pi/agent/extensions/nemotron-tool-repair/index.ts | 2 | ||||
| -rw-r--r-- | pi/agent/models.json | 353 |
2 files changed, 286 insertions, 69 deletions
diff --git a/pi/agent/extensions/nemotron-tool-repair/index.ts b/pi/agent/extensions/nemotron-tool-repair/index.ts index 9bb8f94..ae59a66 100644 --- a/pi/agent/extensions/nemotron-tool-repair/index.ts +++ b/pi/agent/extensions/nemotron-tool-repair/index.ts @@ -20,7 +20,7 @@ import type { ExtensionAPI, ExtensionContext } from "@mariozechner/pi-coding-age const CUSTOM_API = "hyperstack-openai-completions-repaired"; const TARGET_PROVIDERS = new Set(["hyperstack1", "hyperstack2"]); const NEMOTRON_MODEL_PATTERN = /NVIDIA-Nemotron-3-Super/i; -// Matches all Qwen Coder variants (Qwen3-Coder-Next, Qwen3-Coder-30B, etc.) +// Matches Qwen3 Coder variants (Qwen3-Coder-30B, etc.) const QWEN_CODER_MODEL_PATTERN = /Qwen.*Coder/i; const MODELS_JSON_PATH = path.resolve( path.dirname(fileURLToPath(import.meta.url)), diff --git a/pi/agent/models.json b/pi/agent/models.json index 48cd0e9..a5e8200 100644 --- a/pi/agent/models.json +++ b/pi/agent/models.json @@ -14,8 +14,15 @@ "id": "openai/gpt-oss-120b", "name": "GPT-OSS 120B [vm]", "reasoning": true, - "input": ["text"], - "cost": { "input": 0, "output": 0, "cacheRead": 0, "cacheWrite": 0 }, + "input": [ + "text" + ], + "cost": { + "input": 0, + "output": 0, + "cacheRead": 0, + "cacheWrite": 0 + }, "contextWindow": 131072, "maxTokens": 8192 }, @@ -23,17 +30,31 @@ "id": "openai/gpt-oss-20b", "name": "GPT-OSS 20B [vm]", "reasoning": false, - "input": ["text"], - "cost": { "input": 0, "output": 0, "cacheRead": 0, "cacheWrite": 0 }, + "input": [ + "text" + ], + "cost": { + "input": 0, + "output": 0, + "cacheRead": 0, + "cacheWrite": 0 + }, "contextWindow": 65536, "maxTokens": 8192 }, { - "id": "bullpoint/Qwen3-Coder-Next-AWQ-4bit", - "name": "Qwen3 Coder Next [vm]", + "id": "Qwen/Qwen3.6-27B-FP8", + "name": "Qwen3.6 27B FP8 [vm]", "reasoning": true, - "input": ["text"], - "cost": { "input": 0, "output": 0, "cacheRead": 0, "cacheWrite": 0 }, + "input": [ + "text" + ], + "cost": { + "input": 0, + "output": 0, + "cacheRead": 0, + "cacheWrite": 0 + }, "contextWindow": 262144, "maxTokens": 8192, "compat": { @@ -47,8 +68,15 @@ "id": "cyankiwi/gemma-4-31B-it-AWQ-4bit", "name": "Gemma 4 31B IT [vm]", "reasoning": false, - "input": ["text"], - "cost": { "input": 0, "output": 0, "cacheRead": 0, "cacheWrite": 0 }, + "input": [ + "text" + ], + "cost": { + "input": 0, + "output": 0, + "cacheRead": 0, + "cacheWrite": 0 + }, "contextWindow": 131072, "maxTokens": 8192 }, @@ -56,8 +84,15 @@ "id": "cyankiwi/NVIDIA-Nemotron-3-Super-120B-A12B-AWQ-4bit", "name": "Nemotron 3 Super 120B [vm]", "reasoning": false, - "input": ["text"], - "cost": { "input": 0, "output": 0, "cacheRead": 0, "cacheWrite": 0 }, + "input": [ + "text" + ], + "cost": { + "input": 0, + "output": 0, + "cacheRead": 0, + "cacheWrite": 0 + }, "contextWindow": 262144, "maxTokens": 8192 }, @@ -65,8 +100,15 @@ "id": "Qwen/Qwen2.5-Coder-32B-Instruct-AWQ", "name": "Qwen2.5 Coder 32B [vm]", "reasoning": false, - "input": ["text"], - "cost": { "input": 0, "output": 0, "cacheRead": 0, "cacheWrite": 0 }, + "input": [ + "text" + ], + "cost": { + "input": 0, + "output": 0, + "cacheRead": 0, + "cacheWrite": 0 + }, "contextWindow": 32768, "maxTokens": 8192 }, @@ -74,8 +116,15 @@ "id": "QuantTrio/Qwen3-Coder-30B-A3B-Instruct-AWQ", "name": "Qwen3 Coder 30B [vm]", "reasoning": true, - "input": ["text"], - "cost": { "input": 0, "output": 0, "cacheRead": 0, "cacheWrite": 0 }, + "input": [ + "text" + ], + "cost": { + "input": 0, + "output": 0, + "cacheRead": 0, + "cacheWrite": 0 + }, "contextWindow": 65536, "maxTokens": 8192, "compat": { @@ -89,8 +138,15 @@ "id": "casperhansen/deepseek-r1-distill-qwen-32b-awq", "name": "DeepSeek-R1-Distill 32B [vm]", "reasoning": true, - "input": ["text"], - "cost": { "input": 0, "output": 0, "cacheRead": 0, "cacheWrite": 0 }, + "input": [ + "text" + ], + "cost": { + "input": 0, + "output": 0, + "cacheRead": 0, + "cacheWrite": 0 + }, "contextWindow": 32768, "maxTokens": 8192 }, @@ -98,8 +154,15 @@ "id": "Qwen/Qwen3-32B-AWQ", "name": "Qwen3 32B [vm]", "reasoning": true, - "input": ["text"], - "cost": { "input": 0, "output": 0, "cacheRead": 0, "cacheWrite": 0 }, + "input": [ + "text" + ], + "cost": { + "input": 0, + "output": 0, + "cacheRead": 0, + "cacheWrite": 0 + }, "contextWindow": 32768, "maxTokens": 8192, "compat": { @@ -113,8 +176,15 @@ "id": "cyankiwi/Devstral-Small-2507-AWQ-4bit", "name": "Devstral Small 2507 [vm]", "reasoning": false, - "input": ["text"], - "cost": { "input": 0, "output": 0, "cacheRead": 0, "cacheWrite": 0 }, + "input": [ + "text" + ], + "cost": { + "input": 0, + "output": 0, + "cacheRead": 0, + "cacheWrite": 0 + }, "contextWindow": 32768, "maxTokens": 8192 } @@ -134,8 +204,15 @@ "id": "cyankiwi/gemma-4-31B-it-AWQ-4bit", "name": "Gemma 4 31B IT [vm1]", "reasoning": false, - "input": ["text"], - "cost": { "input": 0, "output": 0, "cacheRead": 0, "cacheWrite": 0 }, + "input": [ + "text" + ], + "cost": { + "input": 0, + "output": 0, + "cacheRead": 0, + "cacheWrite": 0 + }, "contextWindow": 131072, "maxTokens": 8192 }, @@ -143,17 +220,31 @@ "id": "cyankiwi/NVIDIA-Nemotron-3-Super-120B-A12B-AWQ-4bit", "name": "Nemotron 3 Super 120B 1M [vm1]", "reasoning": false, - "input": ["text"], - "cost": { "input": 0, "output": 0, "cacheRead": 0, "cacheWrite": 0 }, + "input": [ + "text" + ], + "cost": { + "input": 0, + "output": 0, + "cacheRead": 0, + "cacheWrite": 0 + }, "contextWindow": 1048576, "maxTokens": 8192 }, { - "id": "bullpoint/Qwen3-Coder-Next-AWQ-4bit", - "name": "Qwen3 Coder Next [vm1]", + "id": "Qwen/Qwen3.6-27B-FP8", + "name": "Qwen3.6 27B FP8 [vm1]", "reasoning": true, - "input": ["text"], - "cost": { "input": 0, "output": 0, "cacheRead": 0, "cacheWrite": 0 }, + "input": [ + "text" + ], + "cost": { + "input": 0, + "output": 0, + "cacheRead": 0, + "cacheWrite": 0 + }, "contextWindow": 262144, "maxTokens": 8192, "compat": { @@ -167,8 +258,15 @@ "id": "openai/gpt-oss-20b", "name": "GPT-OSS 20B [vm1]", "reasoning": false, - "input": ["text"], - "cost": { "input": 0, "output": 0, "cacheRead": 0, "cacheWrite": 0 }, + "input": [ + "text" + ], + "cost": { + "input": 0, + "output": 0, + "cacheRead": 0, + "cacheWrite": 0 + }, "contextWindow": 65536, "maxTokens": 8192 }, @@ -176,8 +274,15 @@ "id": "openai/gpt-oss-120b", "name": "GPT-OSS 120B [vm1]", "reasoning": true, - "input": ["text"], - "cost": { "input": 0, "output": 0, "cacheRead": 0, "cacheWrite": 0 }, + "input": [ + "text" + ], + "cost": { + "input": 0, + "output": 0, + "cacheRead": 0, + "cacheWrite": 0 + }, "contextWindow": 131072, "maxTokens": 8192 }, @@ -185,8 +290,15 @@ "id": "Qwen/Qwen2.5-Coder-32B-Instruct-AWQ", "name": "Qwen2.5 Coder 32B [vm1]", "reasoning": false, - "input": ["text"], - "cost": { "input": 0, "output": 0, "cacheRead": 0, "cacheWrite": 0 }, + "input": [ + "text" + ], + "cost": { + "input": 0, + "output": 0, + "cacheRead": 0, + "cacheWrite": 0 + }, "contextWindow": 32768, "maxTokens": 8192 }, @@ -194,8 +306,15 @@ "id": "QuantTrio/Qwen3-Coder-30B-A3B-Instruct-AWQ", "name": "Qwen3 Coder 30B [vm1]", "reasoning": true, - "input": ["text"], - "cost": { "input": 0, "output": 0, "cacheRead": 0, "cacheWrite": 0 }, + "input": [ + "text" + ], + "cost": { + "input": 0, + "output": 0, + "cacheRead": 0, + "cacheWrite": 0 + }, "contextWindow": 65536, "maxTokens": 8192, "compat": { @@ -209,8 +328,15 @@ "id": "casperhansen/deepseek-r1-distill-qwen-32b-awq", "name": "DeepSeek-R1-Distill 32B [vm1]", "reasoning": true, - "input": ["text"], - "cost": { "input": 0, "output": 0, "cacheRead": 0, "cacheWrite": 0 }, + "input": [ + "text" + ], + "cost": { + "input": 0, + "output": 0, + "cacheRead": 0, + "cacheWrite": 0 + }, "contextWindow": 32768, "maxTokens": 8192 }, @@ -218,8 +344,15 @@ "id": "Qwen/Qwen3-32B-AWQ", "name": "Qwen3 32B [vm1]", "reasoning": true, - "input": ["text"], - "cost": { "input": 0, "output": 0, "cacheRead": 0, "cacheWrite": 0 }, + "input": [ + "text" + ], + "cost": { + "input": 0, + "output": 0, + "cacheRead": 0, + "cacheWrite": 0 + }, "contextWindow": 32768, "maxTokens": 8192, "compat": { @@ -233,8 +366,15 @@ "id": "cyankiwi/Devstral-Small-2507-AWQ-4bit", "name": "Devstral Small 2507 [vm1]", "reasoning": false, - "input": ["text"], - "cost": { "input": 0, "output": 0, "cacheRead": 0, "cacheWrite": 0 }, + "input": [ + "text" + ], + "cost": { + "input": 0, + "output": 0, + "cacheRead": 0, + "cacheWrite": 0 + }, "contextWindow": 32768, "maxTokens": 8192 } @@ -254,8 +394,15 @@ "id": "Qwen/Qwen3.6-27B-FP8", "name": "Qwen3.6 27B FP8 [vm2]", "reasoning": true, - "input": ["text"], - "cost": { "input": 0, "output": 0, "cacheRead": 0, "cacheWrite": 0 }, + "input": [ + "text" + ], + "cost": { + "input": 0, + "output": 0, + "cacheRead": 0, + "cacheWrite": 0 + }, "contextWindow": 262144, "maxTokens": 8192, "compat": { @@ -269,17 +416,31 @@ "id": "cyankiwi/gemma-4-31B-it-AWQ-4bit", "name": "Gemma 4 31B IT [vm2]", "reasoning": false, - "input": ["text"], - "cost": { "input": 0, "output": 0, "cacheRead": 0, "cacheWrite": 0 }, + "input": [ + "text" + ], + "cost": { + "input": 0, + "output": 0, + "cacheRead": 0, + "cacheWrite": 0 + }, "contextWindow": 131072, "maxTokens": 8192 }, { - "id": "bullpoint/Qwen3-Coder-Next-AWQ-4bit", - "name": "Qwen3 Coder Next [vm2]", + "id": "Qwen/Qwen3.6-27B-FP8", + "name": "Qwen3.6 27B FP8 [vm2]", "reasoning": true, - "input": ["text"], - "cost": { "input": 0, "output": 0, "cacheRead": 0, "cacheWrite": 0 }, + "input": [ + "text" + ], + "cost": { + "input": 0, + "output": 0, + "cacheRead": 0, + "cacheWrite": 0 + }, "contextWindow": 262144, "maxTokens": 8192, "compat": { @@ -293,8 +454,15 @@ "id": "cyankiwi/NVIDIA-Nemotron-3-Super-120B-A12B-AWQ-4bit", "name": "Nemotron 3 Super 120B [vm2]", "reasoning": false, - "input": ["text"], - "cost": { "input": 0, "output": 0, "cacheRead": 0, "cacheWrite": 0 }, + "input": [ + "text" + ], + "cost": { + "input": 0, + "output": 0, + "cacheRead": 0, + "cacheWrite": 0 + }, "contextWindow": 262144, "maxTokens": 8192 }, @@ -302,8 +470,15 @@ "id": "openai/gpt-oss-20b", "name": "GPT-OSS 20B [vm2]", "reasoning": false, - "input": ["text"], - "cost": { "input": 0, "output": 0, "cacheRead": 0, "cacheWrite": 0 }, + "input": [ + "text" + ], + "cost": { + "input": 0, + "output": 0, + "cacheRead": 0, + "cacheWrite": 0 + }, "contextWindow": 65536, "maxTokens": 8192 }, @@ -311,8 +486,15 @@ "id": "openai/gpt-oss-120b", "name": "GPT-OSS 120B [vm2]", "reasoning": true, - "input": ["text"], - "cost": { "input": 0, "output": 0, "cacheRead": 0, "cacheWrite": 0 }, + "input": [ + "text" + ], + "cost": { + "input": 0, + "output": 0, + "cacheRead": 0, + "cacheWrite": 0 + }, "contextWindow": 131072, "maxTokens": 8192 }, @@ -320,8 +502,15 @@ "id": "Qwen/Qwen2.5-Coder-32B-Instruct-AWQ", "name": "Qwen2.5 Coder 32B [vm2]", "reasoning": false, - "input": ["text"], - "cost": { "input": 0, "output": 0, "cacheRead": 0, "cacheWrite": 0 }, + "input": [ + "text" + ], + "cost": { + "input": 0, + "output": 0, + "cacheRead": 0, + "cacheWrite": 0 + }, "contextWindow": 32768, "maxTokens": 8192 }, @@ -329,8 +518,15 @@ "id": "QuantTrio/Qwen3-Coder-30B-A3B-Instruct-AWQ", "name": "Qwen3 Coder 30B [vm2]", "reasoning": true, - "input": ["text"], - "cost": { "input": 0, "output": 0, "cacheRead": 0, "cacheWrite": 0 }, + "input": [ + "text" + ], + "cost": { + "input": 0, + "output": 0, + "cacheRead": 0, + "cacheWrite": 0 + }, "contextWindow": 65536, "maxTokens": 8192, "compat": { @@ -344,8 +540,15 @@ "id": "casperhansen/deepseek-r1-distill-qwen-32b-awq", "name": "DeepSeek-R1-Distill 32B [vm2]", "reasoning": true, - "input": ["text"], - "cost": { "input": 0, "output": 0, "cacheRead": 0, "cacheWrite": 0 }, + "input": [ + "text" + ], + "cost": { + "input": 0, + "output": 0, + "cacheRead": 0, + "cacheWrite": 0 + }, "contextWindow": 32768, "maxTokens": 8192 }, @@ -353,8 +556,15 @@ "id": "Qwen/Qwen3-32B-AWQ", "name": "Qwen3 32B [vm2]", "reasoning": true, - "input": ["text"], - "cost": { "input": 0, "output": 0, "cacheRead": 0, "cacheWrite": 0 }, + "input": [ + "text" + ], + "cost": { + "input": 0, + "output": 0, + "cacheRead": 0, + "cacheWrite": 0 + }, "contextWindow": 32768, "maxTokens": 8192, "compat": { @@ -368,8 +578,15 @@ "id": "cyankiwi/Devstral-Small-2507-AWQ-4bit", "name": "Devstral Small 2507 [vm2]", "reasoning": false, - "input": ["text"], - "cost": { "input": 0, "output": 0, "cacheRead": 0, "cacheWrite": 0 }, + "input": [ + "text" + ], + "cost": { + "input": 0, + "output": 0, + "cacheRead": 0, + "cacheWrite": 0 + }, "contextWindow": 32768, "maxTokens": 8192 } |
