From 1122c9373cadb90d28b8d588e73f84b86237fd15 Mon Sep 17 00:00:00 2001 From: Paul Buetow Date: Wed, 18 Mar 2026 17:47:45 +0200 Subject: =?UTF-8?q?nemotron-super:=20use=20qwen3=5Fxml=20tool=20call=20par?= =?UTF-8?q?ser=20=E2=80=94=20same=20XML=20format,=20works?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Both Nemotron and Qwen3-XML use identical <tool_call><function=name><parameter=key>value</parameter></function></tool_call> format. qwen3_xml correctly parses Nemotron's output; tool calling now works with opencode and other API clients. Co-Authored-By: Claude Sonnet 4.6 (1M context) --- snippets/hyperstack/hyperstack-vm.toml | 8 ++++---- 1 file changed, 4 insertions(+), 4 deletions(-) (limited to 'snippets/hyperstack/hyperstack-vm.toml') diff --git a/snippets/hyperstack/hyperstack-vm.toml b/snippets/hyperstack/hyperstack-vm.toml index e739d5f..4e47a76 100644 --- a/snippets/hyperstack/hyperstack-vm.toml +++ b/snippets/hyperstack/hyperstack-vm.toml @@ -94,16 +94,16 @@ tool_call_parser = "qwen3_coder" # Requires trust_remote_code=true for the nemotron_h architecture. # Note: cyankiwi AWQ has model_type="nemotron_nas" (underscore); vLLM keys on "nemotron-nas" # (hyphen), so vLLM may not recognise it without trust_remote_code and latest vLLM. -# Tool calling: Nemotron uses a custom XML format (<tool_call><function=name><parameter=key>) -# not supported by any vLLM 0.17.1 built-in parser. tool_call_parser="" disables tool calling. -# Use for long-context analysis and reasoning; switch to qwen3-coder-next for agentic work. +# NVIDIA Nemotron-3-Super uses the same XML tool call format as Qwen3 XML: +# <tool_call><function=name><parameter=key>value</parameter></function></tool_call> +# qwen3_xml handles this format and is compatible with Nemotron's chat template.
[vllm.presets.nemotron-super] model = "cyankiwi/NVIDIA-Nemotron-3-Super-120B-A12B-AWQ-4bit" container_name = "vllm_nemotron_super" max_model_len = 65536 gpu_memory_utilization = 0.92 tensor_parallel_size = 1 -tool_call_parser = "" +tool_call_parser = "qwen3_xml" trust_remote_code = true # nemotron_v3 reasoning parser exposes <think> tokens as reasoning_content in the API. extra_vllm_args = ["--reasoning-parser", "nemotron_v3"] -- cgit v1.2.3