From d994eb751ef3bef126438eca75e9622ace1b8b23 Mon Sep 17 00:00:00 2001
From: Lee Faus
Date: Tue, 23 Dec 2025 12:32:05 -0500
Subject: [PATCH 1/4] feat(middleware): add filtering for empty tool_calls in API responses

Introduced a new middleware to intercept API responses and filter out
empty tool_calls arrays, preventing indefinite waits in the AI SDK.
This includes handling both streaming and non-streaming responses.
Additionally, updated the OpenAI-compatible provider to utilize this
middleware and ensure proper cleanup of pending tool calls in session
processing.
---
 .../src/openai-compatible-middleware.ts       | 226 ++++++++++++++++++
 .../src/openai-compatible-provider.ts         |  12 +-
 packages/opencode/src/session/processor.ts    |  38 ++-
 3 files changed, 273 insertions(+), 3 deletions(-)
 create mode 100644 packages/opencode/src/provider/sdk/openai-compatible/src/openai-compatible-middleware.ts

diff --git a/packages/opencode/src/provider/sdk/openai-compatible/src/openai-compatible-middleware.ts b/packages/opencode/src/provider/sdk/openai-compatible/src/openai-compatible-middleware.ts
new file mode 100644
index 00000000000..245add53c7c
--- /dev/null
+++ b/packages/opencode/src/provider/sdk/openai-compatible/src/openai-compatible-middleware.ts
@@ -0,0 +1,226 @@
+import type { LanguageModelV2 } from "@ai-sdk/provider"
+import { wrapLanguageModel } from "ai"
+
+/**
+ * Wraps a fetch function to filter out empty tool_calls arrays from API responses.
+ *
+ * LM Studio (and some other OpenAI-compatible providers) always include
+ * `tool_calls: []` in responses, even when no tools are called. This causes
+ * the AI SDK to wait indefinitely for tool execution. This function intercepts
+ * the fetch responses and removes empty tool_calls arrays when finish_reason is "stop".
+ */
+export function createFilteredFetch(originalFetch: typeof fetch): typeof fetch {
+  return async (input: RequestInfo | URL, init?: RequestInit): Promise<Response> => {
+    const response = await originalFetch(input, init)
+
+    // Only process JSON responses from chat completions endpoints
+    const url = typeof input === "string" ? input : input instanceof URL ? input.toString() : input.url
+    if (!url.includes("/chat/completions")) {
+      return response
+    }
+
+    const contentType = response.headers.get("content-type")
+
+    // For streaming responses (text/event-stream), process the SSE stream
+    if (contentType && contentType.includes("text/event-stream")) {
+      const originalStream = response.body
+      if (!originalStream) {
+        return response
+      }
+
+      const stream = new ReadableStream({
+        async start(controller) {
+          const reader = originalStream.getReader()
+          const decoder = new TextDecoder()
+          let buffer = ""
+
+          try {
+            while (true) {
+              const { done, value } = await reader.read()
+              if (done) break
+
+              buffer += decoder.decode(value, { stream: true })
+              const chunks = buffer.split("\n\n")
+              buffer = chunks.pop() || ""
+
+              for (const chunk of chunks) {
+                if (chunk.startsWith("data: ")) {
+                  const data = chunk.slice(6).trim()
+                  if (data === "[DONE]") {
+                    controller.enqueue(new TextEncoder().encode("data: [DONE]\n\n"))
+                    continue
+                  }
+
+                  try {
+                    const json = JSON.parse(data)
+                    let modified = false
+
+                    // Process choices in the stream chunk
+                    if (json.choices && Array.isArray(json.choices)) {
+                      const modifiedChoices = json.choices.map((choice: any) => {
+                        // Check delta for empty tool_calls
+                        if (
+                          choice.delta &&
+                          Array.isArray(choice.delta.tool_calls) &&
+                          choice.delta.tool_calls.length === 0
+                        ) {
+                          modified = true
+                          const { tool_calls, ...rest } = choice.delta
+                          return {
+                            ...choice,
+                            delta: rest,
+                          }
+                        }
+
+                        // Check message for empty tool_calls with stop finish_reason
+                        if (
+                          choice.message &&
+                          Array.isArray(choice.message.tool_calls) &&
+                          choice.message.tool_calls.length === 0 &&
+                          choice.finish_reason === "stop"
+                        ) {
+                          modified = true
+                          const { tool_calls, ...rest } = choice.message
+                          return {
+                            ...choice,
+                            message: rest,
+                          }
+                        }
+
+                        return choice
+                      })
+
+                      if (modified) {
+                        json.choices = modifiedChoices
+                        controller.enqueue(
+                          new TextEncoder().encode(`data: ${JSON.stringify(json)}\n\n`)
+                        )
+                        continue
+                      }
+                    }
+
+                    // No modification needed, pass through
+                    controller.enqueue(new TextEncoder().encode(`${chunk}\n\n`))
+                  } catch {
+                    // Not JSON or parse error, pass through
+                    controller.enqueue(new TextEncoder().encode(`${chunk}\n\n`))
+                  }
+                } else if (chunk.trim()) {
+                  // Not a data line but has content, pass through
+                  controller.enqueue(new TextEncoder().encode(`${chunk}\n\n`))
+                }
+              }
+            }
+
+            // Flush remaining buffer
+            if (buffer.trim()) {
+              controller.enqueue(new TextEncoder().encode(buffer))
+            }
+
+            controller.close()
+          } catch (error) {
+            controller.error(error)
+          }
+        },
+      })
+
+      return new Response(stream, {
+        status: response.status,
+        statusText: response.statusText,
+        headers: response.headers,
+      })
+    }
+
+    // For non-streaming JSON responses
+    if (contentType && contentType.includes("application/json")) {
+      // Clone the response so we can read the body
+      const clonedResponse = response.clone()
+
+      try {
+        const text = await clonedResponse.text()
+        let json: any
+
+        try {
+          json = JSON.parse(text)
+        } catch {
+          // Not JSON, return original response
+          return response
+        }
+
+        // Process non-streaming responses
+        if (json.choices && Array.isArray(json.choices)) {
+          let modified = false
+          const modifiedChoices = json.choices.map((choice: any) => {
+            if (
+              choice.message &&
+              Array.isArray(choice.message.tool_calls) &&
+              choice.message.tool_calls.length === 0 &&
+              choice.finish_reason === "stop"
+            ) {
+              modified = true
+              const { tool_calls, ...rest } = choice.message
+              return {
+                ...choice,
+                message: rest,
+              }
+            }
+            return choice
+          })
+
+          if (modified) {
+            return new Response(JSON.stringify({ ...json, choices: modifiedChoices }), {
+              status: response.status,
+              statusText: response.statusText,
+              headers: response.headers,
+            })
+          }
+        }
+      } catch (error) {
+        // If anything goes wrong, return the original response
+        return response
+      }
+    }
+
+    return response
+  }
+}
+
+/**
+ * Wraps a language model to filter out empty tool_calls from responses.
+ * This is a fallback approach that works at the model level.
+ */
+export function filterEmptyToolCalls<T extends LanguageModelV2>(model: T): T {
+  return wrapLanguageModel({
+    model,
+    middleware: [
+      {
+        async transformResult(result) {
+          // Handle non-streaming results
+          if (result.type === "generate") {
+            const content = result.content || []
+            // Filter out any tool-call items that don't have proper IDs
+            // This handles cases where empty tool_calls arrays were parsed
+            const filteredContent = content.filter((item) => {
+              if (item.type === "tool-call") {
+                // Only keep tool-calls that have valid IDs
+                return item.toolCallId && item.toolName
+              }
+              return true
+            })
+
+            // If we filtered anything and finish_reason is "stop", use filtered content
+            if (filteredContent.length !== content.length && result.finishReason === "stop") {
+              return {
+                ...result,
+                content: filteredContent,
+              }
+            }
+          }
+
+          return result
+        },
+      },
+    ],
+  }) as T
+}

diff --git a/packages/opencode/src/provider/sdk/openai-compatible/src/openai-compatible-provider.ts b/packages/opencode/src/provider/sdk/openai-compatible/src/openai-compatible-provider.ts
index e71658c2fa0..7e0a26cbe41 100644
--- a/packages/opencode/src/provider/sdk/openai-compatible/src/openai-compatible-provider.ts
+++ b/packages/opencode/src/provider/sdk/openai-compatible/src/openai-compatible-provider.ts
@@ -2,6 +2,7 @@ import type { LanguageModelV2 } from "@ai-sdk/provider"
 import { OpenAICompatibleChatLanguageModel } from "@ai-sdk/openai-compatible"
 import { type FetchFunction, withoutTrailingSlash, withUserAgentSuffix } from "@ai-sdk/provider-utils"
 import { OpenAIResponsesLanguageModel } from "./responses/openai-responses-language-model"
+import { createFilteredFetch, filterEmptyToolCalls } from "./openai-compatible-middleware"
 
 // Import the version or define it
 const VERSION = "0.1.0"
@@ -66,12 +67,19 @@ export function createOpenaiCompatible(options: OpenaiCompatibleProviderSettings
   const getHeaders = () => withUserAgentSuffix(headers, `ai-sdk/openai-compatible/${VERSION}`)
 
   const createChatModel = (modelId: OpenaiCompatibleModelId) => {
-    return new OpenAICompatibleChatLanguageModel(modelId, {
+    // Wrap the fetch function to filter empty tool_calls arrays
+    const originalFetch = options.fetch ?? fetch
+    const filteredFetch = createFilteredFetch(originalFetch)
+
+    const baseModel = new OpenAICompatibleChatLanguageModel(modelId, {
       provider: `${options.name ?? "openai-compatible"}.chat`,
"openai-compatible"}.chat`, headers: getHeaders, url: ({ path }) => `${baseURL}${path}`, - fetch: options.fetch, + fetch: filteredFetch, }) + + // Also wrap the model with middleware as a fallback + return filterEmptyToolCalls(baseModel) } const createResponsesModel = (modelId: OpenaiCompatibleModelId) => { diff --git a/packages/opencode/src/session/processor.ts b/packages/opencode/src/session/processor.ts index 2f2ba4e944e..0e819017844 100644 --- a/packages/opencode/src/session/processor.ts +++ b/packages/opencode/src/session/processor.ts @@ -248,10 +248,46 @@ export namespace SessionProcessor { input.assistantMessage.finish = value.finishReason input.assistantMessage.cost += usage.cost input.assistantMessage.tokens = usage.tokens + + // Fallback: If finish_reason is "stop" and we have pending tool calls + // that were never invoked, clean them up. This handles cases where + // providers (like LM Studio) send empty tool_calls arrays that cause + // the AI SDK to create pending tool-call events that never complete. + if (value.finishReason === "stop") { + const parts = await MessageV2.parts(input.assistantMessage.id) + for (const part of parts) { + if ( + part.type === "tool" && + part.state.status === "pending" && + (!part.state.input || Object.keys(part.state.input).length === 0) + ) { + // This is a pending tool call that was never actually invoked + // (empty input means it was created from an empty tool_calls array) + // Remove it since finish_reason is "stop" and no tools were called + const startTime = Date.now() + await Session.updatePart({ + ...part, + state: { + status: "error", + input: part.state.input, + error: "Empty tool_calls array filtered", + time: { + start: startTime, + end: Date.now(), + }, + }, + }) + delete toolcalls[part.callID] + delete toolStartTimes[part.callID] + } + } + } + + const finishSnapshot = await Snapshot.track() await Session.updatePart({ id: Identifier.ascending("part"), reason: value.finishReason, - snapshot: await Snapshot.track(), + snapshot: finishSnapshot, messageID: input.assistantMessage.id, sessionID: input.assistantMessage.sessionID, type: "step-finish", From 36385cf7c7580d93f1ad3e72fb0f0313424c7a57 Mon Sep 17 00:00:00 2001 From: Lee Faus Date: Tue, 23 Dec 2025 13:05:48 -0500 Subject: [PATCH 2/4] refactor(middleware): streamline tool_calls filtering and update session processing Updated the createFilteredFetch function to specify the return type and clarified the filtering mechanism for empty tool_calls. Removed unnecessary middleware wrapping in filterEmptyToolCalls, as filtering is now handled at the fetch level. Enhanced session processing to correctly handle empty tool_calls by updating the error state with the appropriate timestamps. --- .../src/openai-compatible-middleware.ts | 41 ++++--------------- 1 file changed, 7 insertions(+), 34 deletions(-) diff --git a/packages/opencode/src/provider/sdk/openai-compatible/src/openai-compatible-middleware.ts b/packages/opencode/src/provider/sdk/openai-compatible/src/openai-compatible-middleware.ts index 245add53c7c..4f751b49352 100644 --- a/packages/opencode/src/provider/sdk/openai-compatible/src/openai-compatible-middleware.ts +++ b/packages/opencode/src/provider/sdk/openai-compatible/src/openai-compatible-middleware.ts @@ -9,7 +9,7 @@ import { wrapLanguageModel } from "ai" * the AI SDK to wait indefinitely for tool execution. This function intercepts * the fetch responses and removes empty tool_calls arrays when finish_reason is "stop". 
  */
-export function createFilteredFetch(originalFetch: typeof fetch): typeof fetch {
+export function createFilteredFetch(originalFetch: typeof fetch): (input: RequestInfo | URL, init?: RequestInit) => Promise<Response> {
   return async (input: RequestInfo | URL, init?: RequestInit): Promise<Response> => {
     const response = await originalFetch(input, init)
 
@@ -187,40 +187,13 @@ export function createFilteredFetch(originalFetch: typeof fetch): typeof fetch {
 
 /**
  * Wraps a language model to filter out empty tool_calls from responses.
- * This is a fallback approach that works at the model level.
+ * Note: This is a placeholder - the actual filtering happens at the fetch level
+ * via createFilteredFetch. This function just returns the model as-is since
+ * wrapLanguageModel middleware only supports transformParams, not transformResult.
  */
 export function filterEmptyToolCalls<T extends LanguageModelV2>(model: T): T {
-  return wrapLanguageModel({
-    model,
-    middleware: [
-      {
-        async transformResult(result) {
-          // Handle non-streaming results
-          if (result.type === "generate") {
-            const content = result.content || []
-            // Filter out any tool-call items that don't have proper IDs
-            // This handles cases where empty tool_calls arrays were parsed
-            const filteredContent = content.filter((item) => {
-              if (item.type === "tool-call") {
-                // Only keep tool-calls that have valid IDs
-                return item.toolCallId && item.toolName
-              }
-              return true
-            })
-
-            // If we filtered anything and finish_reason is "stop", use filtered content
-            if (filteredContent.length !== content.length && result.finishReason === "stop") {
-              return {
-                ...result,
-                content: filteredContent,
-              }
-            }
-          }
-
-          return result
-        },
-      },
-    ],
-  }) as T
+  // The filtering is handled at the fetch level in createFilteredFetch
+  // No need to wrap with middleware since transformResult is not supported
+  return model
 }

From 5a96eec23d3d9d155fbaf5a7e0432a565b36bec1 Mon Sep 17 00:00:00 2001
From: Lee Faus
Date: Tue, 23 Dec 2025 13:23:16 -0500
Subject: [PATCH 3/4] fix: resolve TypeScript errors in cherry-picked commits

---
 .../openai-compatible/src/openai-compatible-middleware.ts | 5 +++--
 packages/opencode/src/session/processor.ts                | 1 -
 2 files changed, 3 insertions(+), 3 deletions(-)

diff --git a/packages/opencode/src/provider/sdk/openai-compatible/src/openai-compatible-middleware.ts b/packages/opencode/src/provider/sdk/openai-compatible/src/openai-compatible-middleware.ts
index 4f751b49352..72f94c65653 100644
--- a/packages/opencode/src/provider/sdk/openai-compatible/src/openai-compatible-middleware.ts
+++ b/packages/opencode/src/provider/sdk/openai-compatible/src/openai-compatible-middleware.ts
@@ -9,8 +9,8 @@
  * the AI SDK to wait indefinitely for tool execution. This function intercepts
  * the fetch responses and removes empty tool_calls arrays when finish_reason is "stop".
  */
-export function createFilteredFetch(originalFetch: typeof fetch): (input: RequestInfo | URL, init?: RequestInit) => Promise<Response> {
-  return async (input: RequestInfo | URL, init?: RequestInit): Promise<Response> => {
+export function createFilteredFetch(originalFetch: typeof fetch): typeof fetch {
+  const filteredFetch = async (input: RequestInfo | URL, init?: RequestInit): Promise<Response> => {
     const response = await originalFetch(input, init)
 
     // Only process JSON responses from chat completions endpoints
@@ -183,6 +183,7 @@ export function createFilteredFetch(originalFetch: typeof fetch): (input: Reques
 
     return response
   }
+  return filteredFetch as typeof fetch
 }
 
 /**
diff --git a/packages/opencode/src/session/processor.ts b/packages/opencode/src/session/processor.ts
index 0e819017844..b79c01c18fa 100644
--- a/packages/opencode/src/session/processor.ts
+++ b/packages/opencode/src/session/processor.ts
@@ -278,7 +278,6 @@ export namespace SessionProcessor {
                   },
                 })
                 delete toolcalls[part.callID]
-                delete toolStartTimes[part.callID]
               }
             }
           }

From 49915e9879ec1d4a7ee50a58506e5593b37333ae Mon Sep 17 00:00:00 2001
From: Lee Faus
Date: Fri, 26 Dec 2025 11:24:00 -0500
Subject: [PATCH 4/4] filtering for just lm-studio

---
 packages/opencode/bin/opencode                | 46 ++++++++++---------
 .../src/openai-compatible-middleware.ts       | 17 +------
 .../src/openai-compatible-provider.ts         | 18 ++++++--
 3 files changed, 39 insertions(+), 42 deletions(-)

diff --git a/packages/opencode/bin/opencode b/packages/opencode/bin/opencode
index e35cc00944d..368cd7e39e9 100755
--- a/packages/opencode/bin/opencode
+++ b/packages/opencode/bin/opencode
@@ -1,12 +1,15 @@
 #!/usr/bin/env node
 
-const childProcess = require("child_process")
-const fs = require("fs")
-const path = require("path")
-const os = require("os")
+import { spawnSync } from "child_process"
+import { realpathSync, existsSync, readdirSync } from "fs"
+import { dirname, join } from "path"
+import { platform, arch } from "os"
+import { fileURLToPath } from "url"
+
+const __filename = fileURLToPath(import.meta.url)
 
 function run(target) {
-  const result = childProcess.spawnSync(target, process.argv.slice(2), {
+  const result = spawnSync(target, process.argv.slice(2), {
     stdio: "inherit",
   })
   if (result.error) {
@@ -21,9 +24,8 @@ const envPath = process.env.OPENCODE_BIN_PATH
 if (envPath) {
   run(envPath)
 }
-
-const scriptPath = fs.realpathSync(__filename)
-const scriptDir = path.dirname(scriptPath)
+const scriptPath = realpathSync(__filename)
+const scriptDir = dirname(scriptPath)
 
 const platformMap = {
   darwin: "darwin",
@@ -36,34 +38,34 @@ const archMap = {
   arm: "arm",
 }
 
-let platform = platformMap[os.platform()]
-if (!platform) {
-  platform = os.platform()
+let platformName = platformMap[platform()]
+if (!platformName) {
+  platformName = platform()
 }
 
-let arch = archMap[os.arch()]
-if (!arch) {
-  arch = os.arch()
+let archName = archMap[arch()]
+if (!archName) {
+  archName = arch()
 }
 
-const base = "opencode-" + platform + "-" + arch
-const binary = platform === "windows" ? "opencode.exe" : "opencode"
+const base = "opencode-" + platformName + "-" + archName
+const binary = platformName === "windows" ? "opencode.exe" : "opencode"
"opencode.exe" : "opencode" function findBinary(startDir) { let current = startDir for (;;) { - const modules = path.join(current, "node_modules") - if (fs.existsSync(modules)) { - const entries = fs.readdirSync(modules) + const modules = join(current, "node_modules") + if (existsSync(modules)) { + const entries = readdirSync(modules) for (const entry of entries) { if (!entry.startsWith(base)) { continue } - const candidate = path.join(modules, entry, "bin", binary) - if (fs.existsSync(candidate)) { + const candidate = join(modules, entry, "bin", binary) + if (existsSync(candidate)) { return candidate } } } - const parent = path.dirname(current) + const parent = dirname(current) if (parent === current) { return } diff --git a/packages/opencode/src/provider/sdk/openai-compatible/src/openai-compatible-middleware.ts b/packages/opencode/src/provider/sdk/openai-compatible/src/openai-compatible-middleware.ts index 72f94c65653..2228b38959a 100644 --- a/packages/opencode/src/provider/sdk/openai-compatible/src/openai-compatible-middleware.ts +++ b/packages/opencode/src/provider/sdk/openai-compatible/src/openai-compatible-middleware.ts @@ -58,21 +58,8 @@ export function createFilteredFetch(originalFetch: typeof fetch): typeof fetch { // Process choices in the stream chunk if (json.choices && Array.isArray(json.choices)) { const modifiedChoices = json.choices.map((choice: any) => { - // Check delta for empty tool_calls - if ( - choice.delta && - Array.isArray(choice.delta.tool_calls) && - choice.delta.tool_calls.length === 0 - ) { - modified = true - const { tool_calls, ...rest } = choice.delta - return { - ...choice, - delta: rest, - } - } - - // Check message for empty tool_calls with stop finish_reason + // Only filter empty tool_calls from the final message when finish_reason is "stop" + // Don't filter from deltas during streaming as they might be part of valid tool call streams if ( choice.message && Array.isArray(choice.message.tool_calls) && diff --git a/packages/opencode/src/provider/sdk/openai-compatible/src/openai-compatible-provider.ts b/packages/opencode/src/provider/sdk/openai-compatible/src/openai-compatible-provider.ts index 7e0a26cbe41..e0e050800fe 100644 --- a/packages/opencode/src/provider/sdk/openai-compatible/src/openai-compatible-provider.ts +++ b/packages/opencode/src/provider/sdk/openai-compatible/src/openai-compatible-provider.ts @@ -67,19 +67,27 @@ export function createOpenaiCompatible(options: OpenaiCompatibleProviderSettings const getHeaders = () => withUserAgentSuffix(headers, `ai-sdk/openai-compatible/${VERSION}`) const createChatModel = (modelId: OpenaiCompatibleModelId) => { - // Wrap the fetch function to filter empty tool_calls arrays const originalFetch = options.fetch ?? fetch - const filteredFetch = createFilteredFetch(originalFetch) + + // Only apply empty tool_calls filtering for LM Studio + // Detect LM Studio by checking baseURL (localhost) or provider name + const isLMStudio = + baseURL.includes("localhost") || + baseURL.includes("127.0.0.1") || + options.name?.toLowerCase().includes("lm-studio") || + options.name?.toLowerCase().includes("lmstudio") + + const fetchToUse = isLMStudio ? createFilteredFetch(originalFetch) : originalFetch const baseModel = new OpenAICompatibleChatLanguageModel(modelId, { provider: `${options.name ?? 
"openai-compatible"}.chat`, headers: getHeaders, url: ({ path }) => `${baseURL}${path}`, - fetch: filteredFetch, + fetch: fetchToUse, }) - // Also wrap the model with middleware as a fallback - return filterEmptyToolCalls(baseModel) + // Only wrap with middleware for LM Studio + return isLMStudio ? filterEmptyToolCalls(baseModel) : baseModel } const createResponsesModel = (modelId: OpenaiCompatibleModelId) => {