fix: max output tokens when using large thinking budget (#2976)

2026-04-09 18:29:39 +00:00 · 2025-10-04 23:38:41 -05:00
parent 5f7ae6477b
commit 71a7e8ef36
2 changed files with 26 additions and 10 deletions
--- a/packages/opencode/src/provider/transform.ts
+++ b/packages/opencode/src/provider/transform.ts
@@ -105,18 +105,29 @@ export namespace ProviderTransform {
    return result
  }

-  export function maxOutputTokens(providerID: string, outputLimit: number, options: Record<string, any>): number {
+  export function maxOutputTokens(
+    providerID: string,
+    options: Record<string, any>,
+    modelLimit: number,
+    globalLimit: number,
+  ): number {
+    const modelCap = modelLimit || globalLimit
+    const standardLimit = Math.min(modelCap, globalLimit)
+
    if (providerID === "anthropic") {
-      const thinking = options["thinking"]
-      if (typeof thinking === "object" && thinking !== null) {
-        const type = thinking["type"]
-        const budgetTokens = thinking["budgetTokens"]
-        if (type === "enabled" && typeof budgetTokens === "number" && budgetTokens > 0) {
-          return outputLimit - budgetTokens
+      const thinking = options?.["thinking"]
+      const budgetTokens = typeof thinking?.["budgetTokens"] === "number" ? thinking["budgetTokens"] : 0
+      const enabled = thinking?.["type"] === "enabled"
+      if (enabled && budgetTokens > 0) {
+        // Return text tokens so that text + thinking <= model cap, preferring 32k text when possible.
+        if (budgetTokens + standardLimit <= modelCap) {
+          return standardLimit
        }
+        return modelCap - budgetTokens
      }
    }
-    return outputLimit
+
+    return standardLimit
  }

  export function schema(_providerID: string, _modelID: string, schema: JSONSchema.BaseSchema) {