feat(ai): Implement Gemini provider with streaming and tool support

- Added GeminiLLM provider implementation using the GoogleGenerativeAI SDK (@google/generative-ai)
- Supports streaming with text/thinking content and completion signals
- Handles Gemini's parts-based content system (text, thought, functionCall)
- Implements tool/function calling with proper format conversion
- Maps between unified types and Gemini-specific formats (model vs assistant role)
- Added test example matching other provider patterns
- Fixed typo in AssistantMessage type (stopResaon -> stopReason) across all providers
Mario Zechner 2025-08-24 20:41:10 +02:00
parent cb4c32faaa
commit a8ba19f0b4
8 changed files with 360 additions and 14 deletions
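
A minimal usage sketch of the new provider, based on the types in this diff; the import path, model name, and message contents are illustrative assumptions, not part of the commit:

import { GeminiLLM } from "./gemini.js"; // hypothetical path

// Picks up GEMINI_API_KEY from the environment when no key is passed.
const llm = new GeminiLLM("gemini-1.5-flash");

const message = await llm.complete(
	{
		systemPrompt: "You are a helpful assistant.",
		messages: [{ role: "user", content: "Summarize streaming in one sentence." }],
	},
	{
		// Streaming callbacks; the boolean marks the end of a text/thinking block.
		onText: (text, done) => process.stdout.write(done ? "\n" : text),
		onThinking: (text, done) => {
			if (!done) process.stderr.write(text);
		},
	},
);

if (message.stopReason === "error") console.error(message.error);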

@@ -186,7 +186,7 @@ export class AnthropicLLM implements LLM<AnthropicLLMOptions> {
 				toolCalls,
 				model: this.model,
 				usage,
-				stopResaon: this.mapStopReason(msg.stop_reason),
+				stopReason: this.mapStopReason(msg.stop_reason),
 			};
 		} catch (error) {
 			return {
@@ -198,7 +198,7 @@ export class AnthropicLLM implements LLM<AnthropicLLMOptions> {
 					cacheRead: 0,
 					cacheWrite: 0,
 				},
-				stopResaon: "error",
+				stopReason: "error",
 				error: error instanceof Error ? error.message : String(error),
 			};
 		}

@@ -0,0 +1,264 @@
import { FunctionCallingMode, GoogleGenerativeAI } from "@google/generative-ai";
import type {
	AssistantMessage,
	Context,
	LLM,
	LLMOptions,
	Message,
	StopReason,
	TokenUsage,
	Tool,
	ToolCall,
} from "../types.js";

export interface GeminiLLMOptions extends LLMOptions {
	toolChoice?: "auto" | "none" | "any";
}
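// Note: "any" forces the model to call a function (FunctionCallingMode.ANY); see mapToolChoice below.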

export class GeminiLLM implements LLM<GeminiLLMOptions> {
	private client: GoogleGenerativeAI;
	private model: string;

	constructor(model: string, apiKey?: string) {
		if (!apiKey) {
			if (!process.env.GEMINI_API_KEY) {
				throw new Error(
					"Gemini API key is required. Set GEMINI_API_KEY environment variable or pass it as an argument.",
				);
			}
			apiKey = process.env.GEMINI_API_KEY;
		}
		this.client = new GoogleGenerativeAI(apiKey);
		this.model = model;
	}

	async complete(context: Context, options?: GeminiLLMOptions): Promise<AssistantMessage> {
		try {
			const model = this.client.getGenerativeModel({
				model: this.model,
				systemInstruction: context.systemPrompt,
				tools: context.tools ? this.convertTools(context.tools) : undefined,
				toolConfig: options?.toolChoice
					? {
							functionCallingConfig: {
								mode: this.mapToolChoice(options.toolChoice),
							},
						}
					: undefined,
			});

			const contents = this.convertMessages(context.messages);
			const stream = await model.generateContentStream({
				contents,
				generationConfig: {
					temperature: options?.temperature,
					maxOutputTokens: options?.maxTokens,
				},
			});

			let content = "";
			let thinking = "";
			const toolCalls: ToolCall[] = [];
			let usage: TokenUsage = {
				input: 0,
				output: 0,
				cacheRead: 0,
				cacheWrite: 0,
			};
			let stopReason: StopReason = "stop";
			let inTextBlock = false;
			let inThinkingBlock = false;

			// Process the stream
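			// inTextBlock/inThinkingBlock track whether a streamed block is
			// currently open, so an empty ("", true) callback can close it when
			// the content type switches or the stream ends.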
			for await (const chunk of stream.stream) {
				// Extract parts from the chunk
				const candidate = chunk.candidates?.[0];
				if (candidate?.content?.parts) {
					for (const part of candidate.content.parts) {
						if (part.text) {
							// Check if it's thinking content
							if ((part as any).thought) {
								thinking += part.text;
								options?.onThinking?.(part.text, false);
								inThinkingBlock = true;
								if (inTextBlock) {
									options?.onText?.("", true);
									inTextBlock = false;
								}
							} else {
								content += part.text;
								options?.onText?.(part.text, false);
								inTextBlock = true;
								if (inThinkingBlock) {
									options?.onThinking?.("", true);
									inThinkingBlock = false;
								}
							}
						}
						// Handle function calls
						if (part.functionCall) {
							if (inTextBlock) {
								options?.onText?.("", true);
								inTextBlock = false;
							}
							if (inThinkingBlock) {
								options?.onThinking?.("", true);
								inThinkingBlock = false;
							}
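							// Gemini does not return tool-call IDs, so one is
							// synthesized to satisfy the unified ToolCall shape.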
							toolCalls.push({
								id: `call_${Date.now()}_${Math.random().toString(36).slice(2, 11)}`,
								name: part.functionCall.name,
								arguments: part.functionCall.args as Record<string, any>,
							});
						}
					}
				}
				// Map finish reason
				if (candidate?.finishReason) {
					stopReason = this.mapStopReason(candidate.finishReason);
				}
			}

			// Signal end of blocks
			if (inTextBlock) {
				options?.onText?.("", true);
			}
			if (inThinkingBlock) {
				options?.onThinking?.("", true);
			}

			// Get final response for usage metadata
			const response = await stream.response;
			if (response.usageMetadata) {
				usage = {
					input: response.usageMetadata.promptTokenCount || 0,
					output: response.usageMetadata.candidatesTokenCount || 0,
					cacheRead: response.usageMetadata.cachedContentTokenCount || 0,
					cacheWrite: 0,
				};
			}

			return {
				role: "assistant",
				content: content || undefined,
				thinking: thinking || undefined,
				toolCalls: toolCalls.length > 0 ? toolCalls : undefined,
				model: this.model,
				usage,
				stopReason,
			};
		} catch (error) {
			return {
				role: "assistant",
				model: this.model,
				usage: {
					input: 0,
					output: 0,
					cacheRead: 0,
					cacheWrite: 0,
				},
				stopReason: "error",
				error: error instanceof Error ? error.message : String(error),
			};
		}
	}

	private convertMessages(messages: Message[]): any[] {
		const contents: any[] = [];
		for (const msg of messages) {
			if (msg.role === "user") {
				contents.push({
					role: "user",
					parts: [{ text: msg.content }],
				});
			} else if (msg.role === "assistant") {
				const parts: any[] = [];
				if (msg.content) {
					parts.push({ text: msg.content });
				}
				if (msg.toolCalls) {
					for (const toolCall of msg.toolCalls) {
						parts.push({
							functionCall: {
								name: toolCall.name,
								args: toolCall.arguments,
							},
						});
					}
				}
				if (parts.length > 0) {
					contents.push({
						role: "model",
						parts,
					});
				}
			} else if (msg.role === "toolResult") {
				// Tool results are sent as function responses. Gemini matches
				// them by function name rather than by call ID, and the
				// synthesized IDs do not encode the name, so recover it from
				// the originating tool call.
				const originatingCall = messages
					.flatMap((m) => (m.role === "assistant" ? (m.toolCalls ?? []) : []))
					.find((call) => call.id === msg.toolCallId);
				contents.push({
					role: "user",
					parts: [
						{
							functionResponse: {
								name: originatingCall?.name ?? msg.toolCallId,
								response: {
									result: msg.content,
									isError: msg.isError || false,
								},
							},
						},
					],
				});
			}
		}
		return contents;
	}
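
	// Illustrative shape produced by convertMessages for one tool round trip
	// (names and values are examples, not from the commit):
	// [
	//   { role: "user", parts: [{ text: "What's the weather in Berlin?" }] },
	//   { role: "model", parts: [{ functionCall: { name: "get_weather", args: { city: "Berlin" } } }] },
	//   { role: "user", parts: [{ functionResponse: { name: "get_weather", response: { result: "22 °C", isError: false } } }] },
	// ]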

	private convertTools(tools: Tool[]): any[] {
		return [
			{
				functionDeclarations: tools.map((tool) => ({
					name: tool.name,
					description: tool.description,
					parameters: tool.parameters,
				})),
			},
		];
	}

	private mapToolChoice(choice: string): FunctionCallingMode {
		switch (choice) {
			case "auto":
				return FunctionCallingMode.AUTO;
			case "none":
				return FunctionCallingMode.NONE;
			case "any":
				return FunctionCallingMode.ANY;
			default:
				return FunctionCallingMode.AUTO;
		}
	}

	private mapStopReason(reason: string): StopReason {
		switch (reason) {
			case "STOP":
				return "stop";
			case "MAX_TOKENS":
				return "length";
			case "SAFETY":
				return "safety";
			case "RECITATION":
				return "safety";
			default:
				return "stop";
		}
	}
}

@@ -163,7 +163,7 @@ export class OpenAICompletionsLLM implements LLM<OpenAICompletionsLLMOptions> {
 				toolCalls: toolCalls.length > 0 ? toolCalls : undefined,
 				model: this.model,
 				usage,
-				stopResaon: this.mapStopReason(finishReason),
+				stopReason: this.mapStopReason(finishReason),
 			};
 		} catch (error) {
 			return {
@@ -175,7 +175,7 @@ export class OpenAICompletionsLLM implements LLM<OpenAICompletionsLLMOptions> {
 					cacheRead: 0,
 					cacheWrite: 0,
 				},
-				stopResaon: "error",
+				stopReason: "error",
 				error: error instanceof Error ? error.message : String(error),
 			};
 		}

@@ -144,7 +144,7 @@ export class OpenAIResponsesLLM implements LLM<OpenAIResponsesLLMOptions> {
 					role: "assistant",
 					model: this.model,
 					usage,
-					stopResaon: "error",
+					stopReason: "error",
 					error: `Code ${event.code}: ${event.message}` || "Unknown error",
 				};
 			}
@@ -158,7 +158,7 @@ export class OpenAIResponsesLLM implements LLM<OpenAIResponsesLLMOptions> {
 				toolCalls: toolCalls.length > 0 ? toolCalls : undefined,
 				model: this.model,
 				usage,
-				stopResaon: stopReason,
+				stopReason,
 			};
 		} catch (error) {
 			return {
@@ -170,7 +170,7 @@ export class OpenAIResponsesLLM implements LLM<OpenAIResponsesLLMOptions> {
 					cacheRead: 0,
 					cacheWrite: 0,
 				},
-				stopResaon: "error",
+				stopReason: "error",
 				error: error instanceof Error ? error.message : String(error),
 			};
 		}

@@ -51,7 +51,7 @@ export interface AssistantMessage {
 	model: string;
 	usage: TokenUsage;
-	stopResaon: StopReason;
+	stopReason: StopReason;
 	error?: string | Error;
 }