summary refs log tree commit diff
path: root/pi
diff options
context:
space:
mode:
author Paul Buetow <paul@buetow.org> 2026-05-24 14:02:34 +0300
committer Paul Buetow <paul@buetow.org> 2026-05-24 14:02:34 +0300
commit c8bd4d1e7a34ebf452d3d6c843d5cef785abe608 (patch)
tree ec1e6c19379c3ba86f6d80d90286eceae393b983 /pi
parent f16f4b753b3bf317e6da79f479ff5f506ed34b47 (diff)
replace qwen3-coder-next with qwen3.6-27b across configs, docs, and tooling
Diffstat (limited to 'pi')
-rw-r--r-- pi/agent/extensions/nemotron-tool-repair/index.ts 2
-rw-r--r-- pi/agent/models.json 353
2 files changed, 286 insertions, 69 deletions
diff --git a/pi/agent/extensions/nemotron-tool-repair/index.ts b/pi/agent/extensions/nemotron-tool-repair/index.ts
index 9bb8f94..ae59a66 100644
--- a/pi/agent/extensions/nemotron-tool-repair/index.ts
+++ b/pi/agent/extensions/nemotron-tool-repair/index.ts
@@ -20,7 +20,7 @@ import type { ExtensionAPI, ExtensionContext } from "@mariozechner/pi-coding-age
const CUSTOM_API = "hyperstack-openai-completions-repaired";
const TARGET_PROVIDERS = new Set(["hyperstack1", "hyperstack2"]);
const NEMOTRON_MODEL_PATTERN = /NVIDIA-Nemotron-3-Super/i;
-// Matches all Qwen Coder variants (Qwen3-Coder-Next, Qwen3-Coder-30B, etc.)
+// Matches all Qwen Coder variants (Qwen2.5-Coder-32B, Qwen3-Coder-30B, etc.)
const QWEN_CODER_MODEL_PATTERN = /Qwen.*Coder/i;
const MODELS_JSON_PATH = path.resolve(
path.dirname(fileURLToPath(import.meta.url)),
diff --git a/pi/agent/models.json b/pi/agent/models.json
index 48cd0e9..a5e8200 100644
--- a/pi/agent/models.json
+++ b/pi/agent/models.json
@@ -14,8 +14,15 @@
"id": "openai/gpt-oss-120b",
"name": "GPT-OSS 120B [vm]",
"reasoning": true,
- "input": ["text"],
- "cost": { "input": 0, "output": 0, "cacheRead": 0, "cacheWrite": 0 },
+ "input": [
+ "text"
+ ],
+ "cost": {
+ "input": 0,
+ "output": 0,
+ "cacheRead": 0,
+ "cacheWrite": 0
+ },
"contextWindow": 131072,
"maxTokens": 8192
},
@@ -23,17 +30,31 @@
"id": "openai/gpt-oss-20b",
"name": "GPT-OSS 20B [vm]",
"reasoning": false,
- "input": ["text"],
- "cost": { "input": 0, "output": 0, "cacheRead": 0, "cacheWrite": 0 },
+ "input": [
+ "text"
+ ],
+ "cost": {
+ "input": 0,
+ "output": 0,
+ "cacheRead": 0,
+ "cacheWrite": 0
+ },
"contextWindow": 65536,
"maxTokens": 8192
},
{
- "id": "bullpoint/Qwen3-Coder-Next-AWQ-4bit",
- "name": "Qwen3 Coder Next [vm]",
+ "id": "Qwen/Qwen3.6-27B-FP8",
+ "name": "Qwen3.6 27B FP8 [vm]",
"reasoning": true,
- "input": ["text"],
- "cost": { "input": 0, "output": 0, "cacheRead": 0, "cacheWrite": 0 },
+ "input": [
+ "text"
+ ],
+ "cost": {
+ "input": 0,
+ "output": 0,
+ "cacheRead": 0,
+ "cacheWrite": 0
+ },
"contextWindow": 262144,
"maxTokens": 8192,
"compat": {
@@ -47,8 +68,15 @@
"id": "cyankiwi/gemma-4-31B-it-AWQ-4bit",
"name": "Gemma 4 31B IT [vm]",
"reasoning": false,
- "input": ["text"],
- "cost": { "input": 0, "output": 0, "cacheRead": 0, "cacheWrite": 0 },
+ "input": [
+ "text"
+ ],
+ "cost": {
+ "input": 0,
+ "output": 0,
+ "cacheRead": 0,
+ "cacheWrite": 0
+ },
"contextWindow": 131072,
"maxTokens": 8192
},
@@ -56,8 +84,15 @@
"id": "cyankiwi/NVIDIA-Nemotron-3-Super-120B-A12B-AWQ-4bit",
"name": "Nemotron 3 Super 120B [vm]",
"reasoning": false,
- "input": ["text"],
- "cost": { "input": 0, "output": 0, "cacheRead": 0, "cacheWrite": 0 },
+ "input": [
+ "text"
+ ],
+ "cost": {
+ "input": 0,
+ "output": 0,
+ "cacheRead": 0,
+ "cacheWrite": 0
+ },
"contextWindow": 262144,
"maxTokens": 8192
},
@@ -65,8 +100,15 @@
"id": "Qwen/Qwen2.5-Coder-32B-Instruct-AWQ",
"name": "Qwen2.5 Coder 32B [vm]",
"reasoning": false,
- "input": ["text"],
- "cost": { "input": 0, "output": 0, "cacheRead": 0, "cacheWrite": 0 },
+ "input": [
+ "text"
+ ],
+ "cost": {
+ "input": 0,
+ "output": 0,
+ "cacheRead": 0,
+ "cacheWrite": 0
+ },
"contextWindow": 32768,
"maxTokens": 8192
},
@@ -74,8 +116,15 @@
"id": "QuantTrio/Qwen3-Coder-30B-A3B-Instruct-AWQ",
"name": "Qwen3 Coder 30B [vm]",
"reasoning": true,
- "input": ["text"],
- "cost": { "input": 0, "output": 0, "cacheRead": 0, "cacheWrite": 0 },
+ "input": [
+ "text"
+ ],
+ "cost": {
+ "input": 0,
+ "output": 0,
+ "cacheRead": 0,
+ "cacheWrite": 0
+ },
"contextWindow": 65536,
"maxTokens": 8192,
"compat": {
@@ -89,8 +138,15 @@
"id": "casperhansen/deepseek-r1-distill-qwen-32b-awq",
"name": "DeepSeek-R1-Distill 32B [vm]",
"reasoning": true,
- "input": ["text"],
- "cost": { "input": 0, "output": 0, "cacheRead": 0, "cacheWrite": 0 },
+ "input": [
+ "text"
+ ],
+ "cost": {
+ "input": 0,
+ "output": 0,
+ "cacheRead": 0,
+ "cacheWrite": 0
+ },
"contextWindow": 32768,
"maxTokens": 8192
},
@@ -98,8 +154,15 @@
"id": "Qwen/Qwen3-32B-AWQ",
"name": "Qwen3 32B [vm]",
"reasoning": true,
- "input": ["text"],
- "cost": { "input": 0, "output": 0, "cacheRead": 0, "cacheWrite": 0 },
+ "input": [
+ "text"
+ ],
+ "cost": {
+ "input": 0,
+ "output": 0,
+ "cacheRead": 0,
+ "cacheWrite": 0
+ },
"contextWindow": 32768,
"maxTokens": 8192,
"compat": {
@@ -113,8 +176,15 @@
"id": "cyankiwi/Devstral-Small-2507-AWQ-4bit",
"name": "Devstral Small 2507 [vm]",
"reasoning": false,
- "input": ["text"],
- "cost": { "input": 0, "output": 0, "cacheRead": 0, "cacheWrite": 0 },
+ "input": [
+ "text"
+ ],
+ "cost": {
+ "input": 0,
+ "output": 0,
+ "cacheRead": 0,
+ "cacheWrite": 0
+ },
"contextWindow": 32768,
"maxTokens": 8192
}
@@ -134,8 +204,15 @@
"id": "cyankiwi/gemma-4-31B-it-AWQ-4bit",
"name": "Gemma 4 31B IT [vm1]",
"reasoning": false,
- "input": ["text"],
- "cost": { "input": 0, "output": 0, "cacheRead": 0, "cacheWrite": 0 },
+ "input": [
+ "text"
+ ],
+ "cost": {
+ "input": 0,
+ "output": 0,
+ "cacheRead": 0,
+ "cacheWrite": 0
+ },
"contextWindow": 131072,
"maxTokens": 8192
},
@@ -143,17 +220,31 @@
"id": "cyankiwi/NVIDIA-Nemotron-3-Super-120B-A12B-AWQ-4bit",
"name": "Nemotron 3 Super 120B 1M [vm1]",
"reasoning": false,
- "input": ["text"],
- "cost": { "input": 0, "output": 0, "cacheRead": 0, "cacheWrite": 0 },
+ "input": [
+ "text"
+ ],
+ "cost": {
+ "input": 0,
+ "output": 0,
+ "cacheRead": 0,
+ "cacheWrite": 0
+ },
"contextWindow": 1048576,
"maxTokens": 8192
},
{
- "id": "bullpoint/Qwen3-Coder-Next-AWQ-4bit",
- "name": "Qwen3 Coder Next [vm1]",
+ "id": "Qwen/Qwen3.6-27B-FP8",
+ "name": "Qwen3.6 27B FP8 [vm1]",
"reasoning": true,
- "input": ["text"],
- "cost": { "input": 0, "output": 0, "cacheRead": 0, "cacheWrite": 0 },
+ "input": [
+ "text"
+ ],
+ "cost": {
+ "input": 0,
+ "output": 0,
+ "cacheRead": 0,
+ "cacheWrite": 0
+ },
"contextWindow": 262144,
"maxTokens": 8192,
"compat": {
@@ -167,8 +258,15 @@
"id": "openai/gpt-oss-20b",
"name": "GPT-OSS 20B [vm1]",
"reasoning": false,
- "input": ["text"],
- "cost": { "input": 0, "output": 0, "cacheRead": 0, "cacheWrite": 0 },
+ "input": [
+ "text"
+ ],
+ "cost": {
+ "input": 0,
+ "output": 0,
+ "cacheRead": 0,
+ "cacheWrite": 0
+ },
"contextWindow": 65536,
"maxTokens": 8192
},
@@ -176,8 +274,15 @@
"id": "openai/gpt-oss-120b",
"name": "GPT-OSS 120B [vm1]",
"reasoning": true,
- "input": ["text"],
- "cost": { "input": 0, "output": 0, "cacheRead": 0, "cacheWrite": 0 },
+ "input": [
+ "text"
+ ],
+ "cost": {
+ "input": 0,
+ "output": 0,
+ "cacheRead": 0,
+ "cacheWrite": 0
+ },
"contextWindow": 131072,
"maxTokens": 8192
},
@@ -185,8 +290,15 @@
"id": "Qwen/Qwen2.5-Coder-32B-Instruct-AWQ",
"name": "Qwen2.5 Coder 32B [vm1]",
"reasoning": false,
- "input": ["text"],
- "cost": { "input": 0, "output": 0, "cacheRead": 0, "cacheWrite": 0 },
+ "input": [
+ "text"
+ ],
+ "cost": {
+ "input": 0,
+ "output": 0,
+ "cacheRead": 0,
+ "cacheWrite": 0
+ },
"contextWindow": 32768,
"maxTokens": 8192
},
@@ -194,8 +306,15 @@
"id": "QuantTrio/Qwen3-Coder-30B-A3B-Instruct-AWQ",
"name": "Qwen3 Coder 30B [vm1]",
"reasoning": true,
- "input": ["text"],
- "cost": { "input": 0, "output": 0, "cacheRead": 0, "cacheWrite": 0 },
+ "input": [
+ "text"
+ ],
+ "cost": {
+ "input": 0,
+ "output": 0,
+ "cacheRead": 0,
+ "cacheWrite": 0
+ },
"contextWindow": 65536,
"maxTokens": 8192,
"compat": {
@@ -209,8 +328,15 @@
"id": "casperhansen/deepseek-r1-distill-qwen-32b-awq",
"name": "DeepSeek-R1-Distill 32B [vm1]",
"reasoning": true,
- "input": ["text"],
- "cost": { "input": 0, "output": 0, "cacheRead": 0, "cacheWrite": 0 },
+ "input": [
+ "text"
+ ],
+ "cost": {
+ "input": 0,
+ "output": 0,
+ "cacheRead": 0,
+ "cacheWrite": 0
+ },
"contextWindow": 32768,
"maxTokens": 8192
},
@@ -218,8 +344,15 @@
"id": "Qwen/Qwen3-32B-AWQ",
"name": "Qwen3 32B [vm1]",
"reasoning": true,
- "input": ["text"],
- "cost": { "input": 0, "output": 0, "cacheRead": 0, "cacheWrite": 0 },
+ "input": [
+ "text"
+ ],
+ "cost": {
+ "input": 0,
+ "output": 0,
+ "cacheRead": 0,
+ "cacheWrite": 0
+ },
"contextWindow": 32768,
"maxTokens": 8192,
"compat": {
@@ -233,8 +366,15 @@
"id": "cyankiwi/Devstral-Small-2507-AWQ-4bit",
"name": "Devstral Small 2507 [vm1]",
"reasoning": false,
- "input": ["text"],
- "cost": { "input": 0, "output": 0, "cacheRead": 0, "cacheWrite": 0 },
+ "input": [
+ "text"
+ ],
+ "cost": {
+ "input": 0,
+ "output": 0,
+ "cacheRead": 0,
+ "cacheWrite": 0
+ },
"contextWindow": 32768,
"maxTokens": 8192
}
@@ -254,8 +394,15 @@
"id": "Qwen/Qwen3.6-27B-FP8",
"name": "Qwen3.6 27B FP8 [vm2]",
"reasoning": true,
- "input": ["text"],
- "cost": { "input": 0, "output": 0, "cacheRead": 0, "cacheWrite": 0 },
+ "input": [
+ "text"
+ ],
+ "cost": {
+ "input": 0,
+ "output": 0,
+ "cacheRead": 0,
+ "cacheWrite": 0
+ },
"contextWindow": 262144,
"maxTokens": 8192,
"compat": {
@@ -269,17 +416,31 @@
"id": "cyankiwi/gemma-4-31B-it-AWQ-4bit",
"name": "Gemma 4 31B IT [vm2]",
"reasoning": false,
- "input": ["text"],
- "cost": { "input": 0, "output": 0, "cacheRead": 0, "cacheWrite": 0 },
+ "input": [
+ "text"
+ ],
+ "cost": {
+ "input": 0,
+ "output": 0,
+ "cacheRead": 0,
+ "cacheWrite": 0
+ },
"contextWindow": 131072,
"maxTokens": 8192
},
{
- "id": "bullpoint/Qwen3-Coder-Next-AWQ-4bit",
- "name": "Qwen3 Coder Next [vm2]",
+ "id": "Qwen/Qwen3.6-27B-FP8",
+ "name": "Qwen3.6 27B FP8 [vm2]",
"reasoning": true,
- "input": ["text"],
- "cost": { "input": 0, "output": 0, "cacheRead": 0, "cacheWrite": 0 },
+ "input": [
+ "text"
+ ],
+ "cost": {
+ "input": 0,
+ "output": 0,
+ "cacheRead": 0,
+ "cacheWrite": 0
+ },
"contextWindow": 262144,
"maxTokens": 8192,
"compat": {
@@ -293,8 +454,15 @@
"id": "cyankiwi/NVIDIA-Nemotron-3-Super-120B-A12B-AWQ-4bit",
"name": "Nemotron 3 Super 120B [vm2]",
"reasoning": false,
- "input": ["text"],
- "cost": { "input": 0, "output": 0, "cacheRead": 0, "cacheWrite": 0 },
+ "input": [
+ "text"
+ ],
+ "cost": {
+ "input": 0,
+ "output": 0,
+ "cacheRead": 0,
+ "cacheWrite": 0
+ },
"contextWindow": 262144,
"maxTokens": 8192
},
@@ -302,8 +470,15 @@
"id": "openai/gpt-oss-20b",
"name": "GPT-OSS 20B [vm2]",
"reasoning": false,
- "input": ["text"],
- "cost": { "input": 0, "output": 0, "cacheRead": 0, "cacheWrite": 0 },
+ "input": [
+ "text"
+ ],
+ "cost": {
+ "input": 0,
+ "output": 0,
+ "cacheRead": 0,
+ "cacheWrite": 0
+ },
"contextWindow": 65536,
"maxTokens": 8192
},
@@ -311,8 +486,15 @@
"id": "openai/gpt-oss-120b",
"name": "GPT-OSS 120B [vm2]",
"reasoning": true,
- "input": ["text"],
- "cost": { "input": 0, "output": 0, "cacheRead": 0, "cacheWrite": 0 },
+ "input": [
+ "text"
+ ],
+ "cost": {
+ "input": 0,
+ "output": 0,
+ "cacheRead": 0,
+ "cacheWrite": 0
+ },
"contextWindow": 131072,
"maxTokens": 8192
},
@@ -320,8 +502,15 @@
"id": "Qwen/Qwen2.5-Coder-32B-Instruct-AWQ",
"name": "Qwen2.5 Coder 32B [vm2]",
"reasoning": false,
- "input": ["text"],
- "cost": { "input": 0, "output": 0, "cacheRead": 0, "cacheWrite": 0 },
+ "input": [
+ "text"
+ ],
+ "cost": {
+ "input": 0,
+ "output": 0,
+ "cacheRead": 0,
+ "cacheWrite": 0
+ },
"contextWindow": 32768,
"maxTokens": 8192
},
@@ -329,8 +518,15 @@
"id": "QuantTrio/Qwen3-Coder-30B-A3B-Instruct-AWQ",
"name": "Qwen3 Coder 30B [vm2]",
"reasoning": true,
- "input": ["text"],
- "cost": { "input": 0, "output": 0, "cacheRead": 0, "cacheWrite": 0 },
+ "input": [
+ "text"
+ ],
+ "cost": {
+ "input": 0,
+ "output": 0,
+ "cacheRead": 0,
+ "cacheWrite": 0
+ },
"contextWindow": 65536,
"maxTokens": 8192,
"compat": {
@@ -344,8 +540,15 @@
"id": "casperhansen/deepseek-r1-distill-qwen-32b-awq",
"name": "DeepSeek-R1-Distill 32B [vm2]",
"reasoning": true,
- "input": ["text"],
- "cost": { "input": 0, "output": 0, "cacheRead": 0, "cacheWrite": 0 },
+ "input": [
+ "text"
+ ],
+ "cost": {
+ "input": 0,
+ "output": 0,
+ "cacheRead": 0,
+ "cacheWrite": 0
+ },
"contextWindow": 32768,
"maxTokens": 8192
},
@@ -353,8 +556,15 @@
"id": "Qwen/Qwen3-32B-AWQ",
"name": "Qwen3 32B [vm2]",
"reasoning": true,
- "input": ["text"],
- "cost": { "input": 0, "output": 0, "cacheRead": 0, "cacheWrite": 0 },
+ "input": [
+ "text"
+ ],
+ "cost": {
+ "input": 0,
+ "output": 0,
+ "cacheRead": 0,
+ "cacheWrite": 0
+ },
"contextWindow": 32768,
"maxTokens": 8192,
"compat": {
@@ -368,8 +578,15 @@
"id": "cyankiwi/Devstral-Small-2507-AWQ-4bit",
"name": "Devstral Small 2507 [vm2]",
"reasoning": false,
- "input": ["text"],
- "cost": { "input": 0, "output": 0, "cacheRead": 0, "cacheWrite": 0 },
+ "input": [
+ "text"
+ ],
+ "cost": {
+ "input": 0,
+ "output": 0,
+ "cacheRead": 0,
+ "cacheWrite": 0
+ },
"contextWindow": 32768,
"maxTokens": 8192
}