Merge pull request #24 from southseact-3d/codex/fix-multiple-request-counting-issue

Limit tool-run loop for Chutes-like OpenAI routes and add regression test
2026-02-12 09:41:22 +00:00
parent b313994578 6a133b3038
commit f61ade810a
2 changed files with 155 additions and 2 deletions
--- a/opencode/packages/opencode/src/session/llm.ts
+++ b/opencode/packages/opencode/src/session/llm.ts
@@ -73,6 +73,13 @@ export namespace LLM {
    retryState: RetryState,
  ): Promise<StreamOutput> {
    const { getLanguage, cfg, provider, auth, isCodex, system, params, options, headers, maxOutputTokens, tools, rateLimitConfig } = config
+    const activeTools = Object.keys(tools).filter((x) => x !== "invalid")
+    const singleStepTools = shouldLimitToolLoop({
+      model: input.model,
+      provider,
+      options,
+      activeTools,
+    })

    while (retryState.attempt <= (rateLimitConfig.maxRetries || 0)) {
      try {
@@ -115,10 +122,10 @@ export namespace LLM {
          topP: params.topP,
          topK: params.topK,
          providerOptions: ProviderTransform.providerOptions(input.model, params.options),
-          activeTools: Object.keys(tools).filter((x) => x !== "invalid"),
+          activeTools,
          tools,
          // Chutes accounts each provider round-trip as a separate request, so keep SDK orchestration to one step.
-          stopWhen: input.model.providerID === "chutes" ? stepCountIs(1) : undefined,
+          stopWhen: singleStepTools ? stepCountIs(1) : undefined,
          maxOutputTokens,
          abortSignal: input.abort,
          headers: {
@@ -467,4 +474,26 @@ export namespace LLM {
    }
    return false
  }
+
+  function shouldLimitToolLoop(input: {
+    model: Provider.Model
+    provider: Provider.Info
+    options: Record<string, any>
+    activeTools: string[]
+  }) {
+    if (input.activeTools.length === 0) return false
+    if (input.model.providerID === "chutes") return true
+
+    const url = [
+      input.model.api.url,
+      input.provider.options?.baseURL,
+      input.provider.options?.baseUrl,
+      input.options?.baseURL,
+      input.options?.baseUrl,
+    ]
+      .filter((x) => typeof x === "string")
+      .map((x) => x.toLowerCase())
+
+    return url.some((x) => x.includes("chutes.ai") || x.includes("/chutes/"))
+  }
 }
--- a/opencode/packages/opencode/test/session/llm.test.ts
+++ b/opencode/packages/opencode/test/session/llm.test.ts
@@ -704,6 +704,130 @@ describe("session.llm.stream", () => {
    })
  })

+  test("limits tool runs to a single SDK step when OpenAI provider targets Chutes baseURL", async () => {
+    const server = state.server
+    if (!server) throw new Error("Server not initialized")
+
+    const providerID = "openai"
+    const modelID = "gpt-4o-mini"
+    const fixture = await loadFixture(providerID, modelID)
+    const model = fixture.model
+
+    const request = waitRequest(
+      "/chat/completions",
+      createEventResponse(
+        [
+          {
+            id: "chatcmpl-1",
+            object: "chat.completion.chunk",
+            choices: [{ delta: { role: "assistant" } }],
+          },
+          {
+            id: "chatcmpl-1",
+            object: "chat.completion.chunk",
+            choices: [
+              {
+                delta: {
+                  tool_calls: [
+                    {
+                      index: 0,
+                      id: "call_1",
+                      type: "function",
+                      function: {
+                        name: "echo",
+                        arguments: '{"value":"hello"}',
+                      },
+                    },
+                  ],
+                },
+              },
+            ],
+          },
+          {
+            id: "chatcmpl-1",
+            object: "chat.completion.chunk",
+            choices: [{ delta: {}, finish_reason: "tool_calls" }],
+          },
+        ],
+        true,
+      ),
+    )
+
+    await using tmp = await tmpdir({
+      init: async (dir) => {
+        await Bun.write(
+          path.join(dir, "opencode.json"),
+          JSON.stringify({
+            $schema: "https://opencode.ai/config.json",
+            enabled_providers: [providerID],
+            provider: {
+              [providerID]: {
+                options: {
+                  apiKey: "test-openai-key",
+                  baseURL: `${server.url.origin}/chutes/v1`,
+                },
+              },
+            },
+          }),
+        )
+      },
+    })
+
+    await Instance.provide({
+      directory: tmp.path,
+      fn: async () => {
+        const resolved = await Provider.getModel(providerID, model.id)
+        const sessionID = "session-test-6"
+        const agent = {
+          name: "test",
+          mode: "primary",
+          options: {},
+          permission: [{ permission: "*", pattern: "*", action: "allow" }],
+          temperature: 0.4,
+        } satisfies Agent.Info
+
+        const user = {
+          id: "user-6",
+          sessionID,
+          role: "user",
+          time: { created: Date.now() },
+          agent: agent.name,
+          model: { providerID, modelID: resolved.id },
+        } satisfies MessageV2.User
+
+        const stream = await LLM.stream({
+          user,
+          sessionID,
+          model: resolved,
+          agent,
+          system: ["You are a helpful assistant."],
+          abort: new AbortController().signal,
+          messages: [{ role: "user", content: "Use echo" }],
+          tools: {
+            echo: tool({
+              inputSchema: jsonSchema({
+                type: "object",
+                properties: {
+                  value: { type: "string" },
+                },
+                required: ["value"],
+                additionalProperties: false,
+              }),
+              execute: async () => "ok",
+            }),
+          },
+        })
+
+        for await (const _ of stream.fullStream) {
+        }
+
+        const capture = await request
+        expect(capture.url.pathname.endsWith("/chat/completions")).toBe(true)
+        expect(state.queue.length).toBe(0)
+      },
+    })
+  })
+
  test("sends Google API payload for Gemini models", async () => {
    const server = state.server
    if (!server) {