summary | refs | log | tree | commit | diff | homepage
diff options
context:
space:
mode:
author: Johannes Loher <[email protected]> 2026-03-18 05:52:16 +0100
committer: GitHub <[email protected]> 2026-03-17 23:52:16 -0500
commit: 56102ff6422ceafdeb349ba12bb08691660471bb (patch)
tree: 8b647d1d63286d7ad447d039e2ff22941654488a
parent: 1b86c27fb8d5b96e09cab48ad33ce08f381652cb (diff)
download: opencode-56102ff6422ceafdeb349ba12bb08691660471bb.tar.gz
          opencode-56102ff6422ceafdeb349ba12bb08691660471bb.zip
fix(core): detect vLLM context overflow errors (#17763)
Co-authored-by: Aiden Cline <[email protected]>
-rw-r--r-- packages/opencode/src/provider/error.ts | 4
1 file changed, 3 insertions, 1 deletion
diff --git a/packages/opencode/src/provider/error.ts b/packages/opencode/src/provider/error.ts
index dd2554489..7a171f4db 100644
--- a/packages/opencode/src/provider/error.ts
+++ b/packages/opencode/src/provider/error.ts
@@ -13,7 +13,7 @@ export namespace ProviderError {
/input token count.*exceeds the maximum/i, // Google (Gemini)
/maximum prompt length is \d+/i, // xAI (Grok)
/reduce the length of the messages/i, // Groq
- /maximum context length is \d+ tokens/i, // OpenRouter, DeepSeek
+ /maximum context length is \d+ tokens/i, // OpenRouter, DeepSeek, vLLM
/exceeds the limit of \d+/i, // GitHub Copilot
/exceeds the available context size/i, // llama.cpp server
/greater than the context length/i, // LM Studio
@@ -21,6 +21,8 @@ export namespace ProviderError {
/exceeded model token limit/i, // Kimi For Coding, Moonshot
/context[_ ]length[_ ]exceeded/i, // Generic fallback
/request entity too large/i, // HTTP 413
+ /context length is only \d+ tokens/i, // vLLM
+ /input length.*exceeds.*context length/i, // vLLM
]
function isOpenAiErrorRetryable(e: APICallError) {