phase 17: disable qwen3.5 thinking mode (think:false) to reduce latency and improve structured output

2026-04-12 12:35:24 -07:00
parent 45f0c03639
commit 6e2f174b19
1 changed file with 1 addition and 0 deletions
@@ -220,6 +220,7 @@ class OllamaClient:
            ],
            "format": json_schema,
            "stream": False,
+            "think": False,
        }

        url = f"{self._config.base_url}/api/chat"