fix: set num_predict=16384 so model has token budget for thinking + content
This commit is contained in:
@@ -227,6 +227,9 @@ class OllamaClient:
|
|||||||
],
|
],
|
||||||
"format": json_schema,
|
"format": json_schema,
|
||||||
"stream": False,
|
"stream": False,
|
||||||
|
"options": {
|
||||||
|
"num_predict": 16384,
|
||||||
|
},
|
||||||
}
|
}
|
||||||
|
|
||||||
url = f"{self._config.base_url}/api/chat"
|
url = f"{self._config.base_url}/api/chat"
|
||||||
|
|||||||
Reference in New Issue
Block a user