Phase 17: disable Qwen3.5 thinking mode (think: false) to reduce latency and make JSON-schema structured output more reliable

This commit is contained in:
Celes Renata
2026-04-12 12:35:24 -07:00
parent 45f0c03639
commit 6e2f174b19
+1
View File
@@ -220,6 +220,7 @@ class OllamaClient:
],
"format": json_schema,
"stream": False,
"think": False,
}
url = f"{self._config.base_url}/api/chat"