fix: set num_predict=16384 so the model has enough token budget for both thinking and content
This commit is contained in:
@@ -227,6 +227,9 @@ class OllamaClient:
|
||||
],
|
||||
"format": json_schema,
|
||||
"stream": False,
|
||||
"options": {
|
||||
"num_predict": 16384,
|
||||
},
|
||||
}
|
||||
|
||||
url = f"{self._config.base_url}/api/chat"
|
||||
|
||||
Reference in New Issue
Block a user