From affb65d7f47663f429117515b89ffcef77d1d3a9 Mon Sep 17 00:00:00 2001
From: Celes Renata
Date: Fri, 1 May 2026 18:56:55 +0000
Subject: [PATCH] fix: point VLLM_BASE_URL to Ollama (10.1.1.12:2701) and update model name

vLLM service on 192.168.42.254:8000 was down, causing extraction failures.
Also updated ai_agents table to use ollama provider directly.
---
 infra/helm/stonks-oracle/values.yaml | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/infra/helm/stonks-oracle/values.yaml b/infra/helm/stonks-oracle/values.yaml
index cbd2d0f..7cebd7d 100644
--- a/infra/helm/stonks-oracle/values.yaml
+++ b/infra/helm/stonks-oracle/values.yaml
@@ -181,8 +181,8 @@ config:
   OLLAMA_RETRY_BASE_DELAY: "1.0"
   OLLAMA_RETRY_MAX_DELAY: "10.0"
   OLLAMA_RETRY_BACKOFF_MULTIPLIER: "2.0"
-  VLLM_BASE_URL: "http://192.168.42.254:8000"
-  VLLM_MODEL: "AxionML/Qwen3.5-9B-NVFP4"
+  VLLM_BASE_URL: "http://10.1.1.12:2701"
+  VLLM_MODEL: "qwen3.5:9b-fast"
   VLLM_TIMEOUT: "120"
   VLLM_MAX_RETRIES: "2"
   VLLM_TEMPERATURE: "0.7"