fix(ai): use enable_thinking for Z.ai instead of thinking param (#1674)

Z.ai uses the same enable_thinking: boolean parameter as Qwen to control reasoning, not thinking: { type: "enabled" | "disabled" }. The wrong parameter name means Z.ai ignores the disable request and always runs with thinking enabled, wasting tokens and adding latency. Merge the Z.ai and Qwen branches since they use the same format. PR by @okuyam2y
2026-04-15 13:03:42 +00:00 · 2026-02-28 05:33:14 +09:00 · 2026-02-28 05:33:14 +09:00 · 22b3be834e
commit 22b3be834e
parent 8880cd3cb8
1 changed files with 2 additions and 6 deletions
--- a/packages/ai/src/providers/openai-completions.ts
+++ b/packages/ai/src/providers/openai-completions.ts
@ -423,12 +423,8 @@ function buildParams(model: Model<"openai-completions">, context: Context, optio
 		params.tool_choice = options.toolChoice;
 	}

-	if (compat.thinkingFormat === "zai" && model.reasoning) {
-		// Z.ai uses binary thinking: { type: "enabled" | "disabled" }
-		// Must explicitly disable since z.ai defaults to thinking enabled
-		(params as any).thinking = { type: options?.reasoningEffort ? "enabled" : "disabled" };
-	} else if (compat.thinkingFormat === "qwen" && model.reasoning) {
-		// Qwen uses enable_thinking: boolean
+	if ((compat.thinkingFormat === "zai" || compat.thinkingFormat === "qwen") && model.reasoning) {
+		// Both Z.ai and Qwen use enable_thinking: boolean
 		(params as any).enable_thinking = !!options?.reasoningEffort;
 	} else if (options?.reasoningEffort && model.reasoning && compat.supportsReasoningEffort) {
 		// OpenAI-style reasoning_effort