Merge d6396ac86f5d5f0eecd8dbda89c6bcd7314e6b7d into 5e417b44e1540f528d2ae63e3e20229a902d1db2

2026-03-21 02:55:25 +00:00 · 2026-03-21 02:55:25 +00:00 · f83eba1095
commit f83eba1095
parent 5e417b44e1 d6396ac86f
2 changed files with 67 additions and 0 deletions
--- a/src/agents/ollama-stream.test.ts
+++ b/src/agents/ollama-stream.test.ts
@@ -544,6 +544,60 @@ describe("createOllamaStreamFn", () => {
      [{ type: "text", text: "final answer" }],
    );
  });
+
+  it("sends think:true when reasoning level is set", async () => {
+    await withMockNdjsonFetch(
+      [
+        '{"model":"m","created_at":"t","message":{"role":"assistant","content":"ok"},"done":false}',
+        '{"model":"m","created_at":"t","message":{"role":"assistant","content":""},"done":true,"prompt_eval_count":1,"eval_count":1}',
+      ],
+      async (fetchMock) => {
+        const streamFn = createOllamaStreamFn("http://ollama-host:11434");
+        const stream = await streamFn(
+          {
+            id: "deepseek-r1:32b",
+            api: "ollama",
+            provider: "ollama",
+            contextWindow: 131072,
+          } as never,
+          { messages: [{ role: "user", content: "hello" }] } as never,
+          { reasoning: "medium" } as never,
+        );
+        await collectStreamEvents(stream);
+
+        const [, reqInit] = fetchMock.mock.calls[0] as unknown as [string, RequestInit];
+        const body = JSON.parse(reqInit.body as string) as { think?: boolean };
+        expect(body.think).toBe(true);
+      },
+    );
+  });
+
+  it("sends think:false when reasoning is not set but options are present", async () => {
+    await withMockNdjsonFetch(
+      [
+        '{"model":"m","created_at":"t","message":{"role":"assistant","content":"ok"},"done":false}',
+        '{"model":"m","created_at":"t","message":{"role":"assistant","content":""},"done":true,"prompt_eval_count":1,"eval_count":1}',
+      ],
+      async (fetchMock) => {
+        const streamFn = createOllamaStreamFn("http://ollama-host:11434");
+        const stream = await streamFn(
+          {
+            id: "deepseek-r1:32b",
+            api: "ollama",
+            provider: "ollama",
+            contextWindow: 131072,
+          } as never,
+          { messages: [{ role: "user", content: "hello" }] } as never,
+          {} as never,
+        );
+        await collectStreamEvents(stream);
+
+        const [, reqInit] = fetchMock.mock.calls[0] as unknown as [string, RequestInit];
+        const body = JSON.parse(reqInit.body as string) as { think?: boolean };
+        expect(body.think).toBe(false);
+      },
+    );
+  });
 });

 describe("resolveOllamaBaseUrlForRun", () => {
--- a/src/agents/ollama-stream.ts
+++ b/src/agents/ollama-stream.ts
@@ -42,6 +42,7 @@ interface OllamaChatRequest {
  model: string;
  messages: OllamaChatMessage[];
  stream: boolean;
+  think?: boolean;
  tools?: OllamaTool[];
  options?: Record<string, unknown>;
 }
@@ -459,10 +460,22 @@ export function createOllamaStreamFn(
          ollamaOptions.num_predict = options.maxTokens;
        }

+        // Ollama thinking models (e.g. deepseek-r1, qwq) respect a top-level
+        // `think` boolean. Any truthy reasoning level maps to `think: true`;
+        // options without one send `think: false`; no options omit it (#46680).
+        const thinkParam: { think?: boolean } = {};
+        if (options?.reasoning) {
+          thinkParam.think = true;
+        } else if (options) {
+          // Options given without a reasoning level – tell Ollama not to think.
+          thinkParam.think = false;
+        }
+
        const body: OllamaChatRequest = {
          model: model.id,
          messages: ollamaMessages,
          stream: true,
+          ...thinkParam,
          ...(ollamaTools.length > 0 ? { tools: ollamaTools } : {}),
          options: ollamaOptions,
        };