From 4f2ae23d4269255365a286fcb8b10bb9fccb0fdd Mon Sep 17 00:00:00 2001 From: Celes Renata Date: Wed, 15 Apr 2026 01:47:00 +0000 Subject: [PATCH] fix: set num_predict=16384 so model has token budget for thinking + content --- services/extractor/client.py | 3 +++ 1 file changed, 3 insertions(+) diff --git a/services/extractor/client.py b/services/extractor/client.py index 64efd99..21a57c0 100644 --- a/services/extractor/client.py +++ b/services/extractor/client.py @@ -227,6 +227,9 @@ class OllamaClient: ], "format": json_schema, "stream": False, + "options": { + "num_predict": 16384, + }, } url = f"{self._config.base_url}/api/chat"