From d2870c4b34cb2a61e47ef146f5a4705b48d4eac3 Mon Sep 17 00:00:00 2001
From: Advait Jayant
Date: Wed, 24 Jun 2026 22:07:52 +0100
Subject: [PATCH] Raise hosted context window from 64K to 128K

The banner's '65.5K' came from a flat context_length: 65536 in the
config (the model block + the opengradient provider), not from the
model -- so the harness compacted at 64K even though every hosted
model handles far more. DeepSeek V4 Pro and Hermes 4 405B/70B are all
>=128K native, so bump both hosted entries to 131072. Conservative on
purpose (won't over-send past the gateway); can go higher if the
gateway serves the full window. Local (ollama) windows unchanged.
---
 profile/config.yaml | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/profile/config.yaml b/profile/config.yaml
index 7af5982..2fa5ca4 100644
--- a/profile/config.yaml
+++ b/profile/config.yaml
@@ -2,7 +2,7 @@ model:
   base_url: http://127.0.0.1:8788/v1
   default: deepseek/deepseek-v4-pro
   provider: opengradient
-  context_length: 65536
+  context_length: 131072
   ollama_num_ctx: 65536
 fallback_model:
   provider: ollama-local
@@ -18,7 +18,7 @@ providers:
     base_url: http://127.0.0.1:8788/v1
     api_key: managed-by-og-veil
     default_model: deepseek/deepseek-v4-pro
-    context_length: 65536
+    context_length: 131072
   ollama-local:
     base_url: http://localhost:11434/v1
     api_key: ollama