mirror of
https://github.com/getcompanion-ai/co-mono.git
synced 2026-04-15 12:03:49 +00:00
refactor(ai): Implement unified model system with type-safe createLLM
- Add Model interface to types.ts with normalized structure - Create type-safe generic createLLM function with provider-specific model constraints - Generate models from OpenRouter API and models.dev data - Strip provider prefixes for direct providers (google, openai, anthropic, xai) - Keep full model IDs for OpenRouter-proxied models - Clean separation: types.ts (Model interface), models.ts (factory logic), models.generated.ts (data) - Remove old model scripts and unused dependencies - Rename GeminiLLM to GoogleLLM for consistency - Add tests for new providers (xAI, Groq, Cerebras, OpenRouter) - Support 181 tool-capable models across 7 providers with full type safety
This commit is contained in:
parent
3f36051bc6
commit
c7618db3f7
8 changed files with 409 additions and 418 deletions
|
|
@ -13,12 +13,12 @@ npm install @mariozechner/ai
|
|||
```typescript
|
||||
import { AnthropicLLM } from '@mariozechner/ai/providers/anthropic';
|
||||
import { OpenAICompletionsLLM } from '@mariozechner/ai/providers/openai-completions';
|
||||
import { GeminiLLM } from '@mariozechner/ai/providers/gemini';
|
||||
import { GoogleLLM } from '@mariozechner/ai/providers/gemini';
|
||||
|
||||
// Pick your provider - same API for all
|
||||
const llm = new AnthropicLLM('claude-sonnet-4-0');
|
||||
// const llm = new OpenAICompletionsLLM('gpt-5-mini');
|
||||
// const llm = new GeminiLLM('gemini-2.5-flash');
|
||||
// const llm = new GoogleLLM('gemini-2.5-flash');
|
||||
|
||||
// Basic completion
|
||||
const response = await llm.complete({
|
||||
|
|
|
|||
|
|
@ -11,15 +11,11 @@
|
|||
],
|
||||
"scripts": {
|
||||
"clean": "rm -rf dist",
|
||||
"models": "curl -s https://models.dev/api.json -o src/models.json",
|
||||
"generate-models": "npx tsx scripts/generate-models.ts",
|
||||
"build": "npm run generate-models && tsc -p tsconfig.build.json && cp src/models.json dist/models.json",
|
||||
"build": "npm run generate-models && tsc -p tsconfig.build.json",
|
||||
"check": "biome check --write .",
|
||||
"test": "vitest",
|
||||
"test:ui": "vitest --ui",
|
||||
"test:old": "npx tsx --test test/providers.test.ts",
|
||||
"extract-models": "npx tsx scripts/extract-openai-models.ts",
|
||||
"prepublishOnly": "npm run clean && npm run models && npm run build"
|
||||
"test": "vitest --run",
|
||||
"prepublishOnly": "npm run clean && npm run build"
|
||||
},
|
||||
"dependencies": {
|
||||
"@anthropic-ai/sdk": "^0.60.0",
|
||||
|
|
@ -48,7 +44,6 @@
|
|||
},
|
||||
"devDependencies": {
|
||||
"@types/node": "^24.3.0",
|
||||
"@vitest/ui": "^3.2.4",
|
||||
"vitest": "^3.2.4"
|
||||
}
|
||||
}
|
||||
|
|
|
|||
|
|
@ -3,263 +3,260 @@
|
|||
import { readFileSync, writeFileSync } from "fs";
|
||||
import { join } from "path";
|
||||
|
||||
// Load the models.json file
|
||||
const data = JSON.parse(readFileSync(join(process.cwd(), "src/models.json"), "utf-8"));
|
||||
|
||||
// Categorize providers by their API type
|
||||
const openaiModels: Record<string, any> = {};
|
||||
const openaiCompatibleProviders: Record<string, any> = {};
|
||||
const anthropicModels: Record<string, any> = {};
|
||||
const geminiModels: Record<string, any> = {};
|
||||
|
||||
for (const [providerId, provider] of Object.entries(data)) {
|
||||
const p = provider as any;
|
||||
|
||||
if (providerId === "openai") {
|
||||
// All OpenAI models use the Responses API
|
||||
openaiModels[providerId] = p;
|
||||
} else if (providerId === "anthropic" || providerId === "google-vertex-anthropic") {
|
||||
// Anthropic direct and via Vertex
|
||||
anthropicModels[providerId] = p;
|
||||
} else if (providerId === "google" || providerId === "google-vertex") {
|
||||
// Google Gemini models
|
||||
geminiModels[providerId] = p;
|
||||
} else if (p.npm === "@ai-sdk/openai-compatible" ||
|
||||
p.npm === "@ai-sdk/groq" ||
|
||||
p.npm === "@ai-sdk/cerebras" ||
|
||||
p.npm === "@ai-sdk/fireworks" ||
|
||||
p.npm === "@ai-sdk/openrouter" ||
|
||||
p.npm === "@ai-sdk/openai" && providerId !== "openai" ||
|
||||
p.api?.includes("/v1") ||
|
||||
["together", "ollama", "llama", "github-models", "groq", "cerebras", "openrouter", "fireworks"].includes(providerId)) {
|
||||
// OpenAI-compatible providers - they all speak the OpenAI completions API
|
||||
// Set default base URLs for known providers
|
||||
if (!p.api) {
|
||||
switch (providerId) {
|
||||
case "groq": p.api = "https://api.groq.com/openai/v1"; break;
|
||||
case "cerebras": p.api = "https://api.cerebras.com/v1"; break;
|
||||
case "together": p.api = "https://api.together.xyz/v1"; break;
|
||||
case "fireworks": p.api = "https://api.fireworks.ai/v1"; break;
|
||||
}
|
||||
}
|
||||
openaiCompatibleProviders[providerId] = p;
|
||||
}
|
||||
interface ModelsDevModel {
|
||||
id: string;
|
||||
name: string;
|
||||
tool_call?: boolean;
|
||||
reasoning?: boolean;
|
||||
limit?: {
|
||||
context?: number;
|
||||
output?: number;
|
||||
};
|
||||
cost?: {
|
||||
input?: number;
|
||||
output?: number;
|
||||
cache_read?: number;
|
||||
cache_write?: number;
|
||||
};
|
||||
modalities?: {
|
||||
input?: string[];
|
||||
};
|
||||
}
|
||||
|
||||
// Generate the TypeScript file
|
||||
let output = `// This file is auto-generated by scripts/generate-models.ts
|
||||
interface NormalizedModel {
|
||||
id: string;
|
||||
name: string;
|
||||
provider: string;
|
||||
reasoning: boolean;
|
||||
input: ("text" | "image")[];
|
||||
cost: {
|
||||
input: number;
|
||||
output: number;
|
||||
cacheRead: number;
|
||||
cacheWrite: number;
|
||||
};
|
||||
contextWindow: number;
|
||||
maxTokens: number;
|
||||
}
|
||||
|
||||
async function fetchOpenRouterModels(): Promise<NormalizedModel[]> {
|
||||
try {
|
||||
console.log("🌐 Fetching models from OpenRouter API...");
|
||||
const response = await fetch("https://openrouter.ai/api/v1/models");
|
||||
const data = await response.json();
|
||||
|
||||
const models: NormalizedModel[] = [];
|
||||
|
||||
for (const model of data.data) {
|
||||
// Only include models that support tools
|
||||
if (!model.supported_parameters?.includes("tools")) continue;
|
||||
|
||||
// Parse provider from model ID
|
||||
const [providerPrefix] = model.id.split("/");
|
||||
let provider = "";
|
||||
let modelKey = model.id;
|
||||
|
||||
// Map provider prefixes to our provider names
|
||||
if (model.id.startsWith("google/")) {
|
||||
provider = "google";
|
||||
modelKey = model.id.replace("google/", "");
|
||||
} else if (model.id.startsWith("openai/")) {
|
||||
provider = "openai";
|
||||
modelKey = model.id.replace("openai/", "");
|
||||
} else if (model.id.startsWith("anthropic/")) {
|
||||
provider = "anthropic";
|
||||
modelKey = model.id.replace("anthropic/", "");
|
||||
} else if (model.id.startsWith("x-ai/")) {
|
||||
provider = "xai";
|
||||
modelKey = model.id.replace("x-ai/", "");
|
||||
} else {
|
||||
// All other models go through OpenRouter
|
||||
provider = "openrouter";
|
||||
modelKey = model.id; // Keep full ID for OpenRouter
|
||||
}
|
||||
|
||||
// Skip if not one of our supported providers
|
||||
if (!["google", "openai", "anthropic", "xai", "openrouter"].includes(provider)) {
|
||||
continue;
|
||||
}
|
||||
|
||||
// Parse input modalities
|
||||
const input: ("text" | "image")[] = ["text"];
|
||||
if (model.architecture?.modality?.includes("image")) {
|
||||
input.push("image");
|
||||
}
|
||||
|
||||
// Convert pricing from $/token to $/million tokens
|
||||
const inputCost = parseFloat(model.pricing?.prompt || "0") * 1_000_000;
|
||||
const outputCost = parseFloat(model.pricing?.completion || "0") * 1_000_000;
|
||||
const cacheReadCost = parseFloat(model.pricing?.input_cache_read || "0") * 1_000_000;
|
||||
const cacheWriteCost = parseFloat(model.pricing?.input_cache_write || "0") * 1_000_000;
|
||||
|
||||
models.push({
|
||||
id: modelKey,
|
||||
name: model.name,
|
||||
provider,
|
||||
reasoning: model.supported_parameters?.includes("reasoning") || false,
|
||||
input,
|
||||
cost: {
|
||||
input: inputCost,
|
||||
output: outputCost,
|
||||
cacheRead: cacheReadCost,
|
||||
cacheWrite: cacheWriteCost,
|
||||
},
|
||||
contextWindow: model.context_length || 4096,
|
||||
maxTokens: model.top_provider?.max_completion_tokens || 4096,
|
||||
});
|
||||
}
|
||||
|
||||
console.log(`✅ Fetched ${models.length} tool-capable models from OpenRouter`);
|
||||
return models;
|
||||
} catch (error) {
|
||||
console.error("❌ Failed to fetch OpenRouter models:", error);
|
||||
return [];
|
||||
}
|
||||
}
|
||||
|
||||
function loadModelsDevData(): NormalizedModel[] {
|
||||
try {
|
||||
console.log("📁 Loading models from models.json...");
|
||||
const data = JSON.parse(readFileSync(join(process.cwd(), "src/models.json"), "utf-8"));
|
||||
|
||||
const models: NormalizedModel[] = [];
|
||||
|
||||
// Process Groq models
|
||||
if (data.groq?.models) {
|
||||
for (const [modelId, model] of Object.entries(data.groq.models)) {
|
||||
const m = model as ModelsDevModel;
|
||||
if (m.tool_call !== true) continue;
|
||||
|
||||
models.push({
|
||||
id: modelId,
|
||||
name: m.name || modelId,
|
||||
provider: "groq",
|
||||
reasoning: m.reasoning === true,
|
||||
input: m.modalities?.input?.includes("image") ? ["text", "image"] : ["text"],
|
||||
cost: {
|
||||
input: m.cost?.input || 0,
|
||||
output: m.cost?.output || 0,
|
||||
cacheRead: m.cost?.cache_read || 0,
|
||||
cacheWrite: m.cost?.cache_write || 0,
|
||||
},
|
||||
contextWindow: m.limit?.context || 4096,
|
||||
maxTokens: m.limit?.output || 4096,
|
||||
});
|
||||
}
|
||||
}
|
||||
|
||||
// Process Cerebras models
|
||||
if (data.cerebras?.models) {
|
||||
for (const [modelId, model] of Object.entries(data.cerebras.models)) {
|
||||
const m = model as ModelsDevModel;
|
||||
if (m.tool_call !== true) continue;
|
||||
|
||||
models.push({
|
||||
id: modelId,
|
||||
name: m.name || modelId,
|
||||
provider: "cerebras",
|
||||
reasoning: m.reasoning === true,
|
||||
input: m.modalities?.input?.includes("image") ? ["text", "image"] : ["text"],
|
||||
cost: {
|
||||
input: m.cost?.input || 0,
|
||||
output: m.cost?.output || 0,
|
||||
cacheRead: m.cost?.cache_read || 0,
|
||||
cacheWrite: m.cost?.cache_write || 0,
|
||||
},
|
||||
contextWindow: m.limit?.context || 4096,
|
||||
maxTokens: m.limit?.output || 4096,
|
||||
});
|
||||
}
|
||||
}
|
||||
|
||||
console.log(`✅ Loaded ${models.length} tool-capable models from models.dev`);
|
||||
return models;
|
||||
} catch (error) {
|
||||
console.error("❌ Failed to load models.dev data:", error);
|
||||
return [];
|
||||
}
|
||||
}
|
||||
|
||||
async function generateModels() {
|
||||
// Fetch all models
|
||||
const openRouterModels = await fetchOpenRouterModels();
|
||||
const modelsDevModels = loadModelsDevData();
|
||||
|
||||
// Combine models (models.dev takes priority for Groq/Cerebras)
|
||||
const allModels = [...modelsDevModels, ...openRouterModels];
|
||||
|
||||
// Group by provider
|
||||
const providers: Record<string, NormalizedModel[]> = {};
|
||||
for (const model of allModels) {
|
||||
if (!providers[model.provider]) {
|
||||
providers[model.provider] = [];
|
||||
}
|
||||
providers[model.provider].push(model);
|
||||
}
|
||||
|
||||
// Generate TypeScript file
|
||||
let output = `// This file is auto-generated by scripts/generate-models.ts
|
||||
// Do not edit manually - run 'npm run generate-models' to update
|
||||
|
||||
import type { ModalityInput, ModalityOutput } from "./models.js";
|
||||
|
||||
export interface ModelData {
|
||||
id: string;
|
||||
name: string;
|
||||
reasoning: boolean;
|
||||
tool_call: boolean;
|
||||
attachment: boolean;
|
||||
temperature: boolean;
|
||||
knowledge?: string;
|
||||
release_date: string;
|
||||
last_updated: string;
|
||||
modalities: {
|
||||
input: ModalityInput[];
|
||||
output: ModalityOutput[];
|
||||
};
|
||||
open_weights: boolean;
|
||||
limit: {
|
||||
context: number;
|
||||
output: number;
|
||||
};
|
||||
cost?: {
|
||||
input: number;
|
||||
output: number;
|
||||
cache_read?: number;
|
||||
cache_write?: number;
|
||||
};
|
||||
}
|
||||
|
||||
export interface ProviderData {
|
||||
id: string;
|
||||
name: string;
|
||||
baseUrl?: string;
|
||||
env?: string[];
|
||||
models: Record<string, ModelData>;
|
||||
}
|
||||
import type { Model } from "./types.js";
|
||||
|
||||
export const PROVIDERS = {
|
||||
`;
|
||||
|
||||
// Generate OpenAI models
|
||||
output += `// OpenAI models - all use OpenAIResponsesLLM\n`;
|
||||
output += `export const OPENAI_MODELS = {\n`;
|
||||
for (const [providerId, provider] of Object.entries(openaiModels)) {
|
||||
const p = provider as any;
|
||||
for (const [modelId, model] of Object.entries(p.models || {})) {
|
||||
const m = model as any;
|
||||
output += ` "${modelId}": ${JSON.stringify(m, null, 8).split('\n').join('\n ')},\n`;
|
||||
}
|
||||
}
|
||||
output += `} as const;\n\n`;
|
||||
// Generate provider sections
|
||||
for (const [providerId, models] of Object.entries(providers)) {
|
||||
output += `\t${providerId}: {\n`;
|
||||
output += `\t\tmodels: {\n`;
|
||||
|
||||
// Generate OpenAI-compatible providers
|
||||
output += `// OpenAI-compatible providers - use OpenAICompletionsLLM\n`;
|
||||
output += `export const OPENAI_COMPATIBLE_PROVIDERS = {\n`;
|
||||
for (const [providerId, provider] of Object.entries(openaiCompatibleProviders)) {
|
||||
const p = provider as any;
|
||||
output += ` "${providerId}": {\n`;
|
||||
output += ` id: "${providerId}",\n`;
|
||||
output += ` name: "${p.name}",\n`;
|
||||
if (p.api) {
|
||||
output += ` baseUrl: "${p.api}",\n`;
|
||||
}
|
||||
if (p.env) {
|
||||
output += ` env: ${JSON.stringify(p.env)},\n`;
|
||||
}
|
||||
output += ` models: {\n`;
|
||||
for (const [modelId, model] of Object.entries(p.models || {})) {
|
||||
const m = model as any;
|
||||
output += ` "${modelId}": ${JSON.stringify(m, null, 12).split('\n').join('\n ')},\n`;
|
||||
}
|
||||
output += ` }\n`;
|
||||
output += ` },\n`;
|
||||
}
|
||||
output += `} as const;\n\n`;
|
||||
for (const model of models) {
|
||||
output += `\t\t\t"${model.id}": {\n`;
|
||||
output += `\t\t\t\tid: "${model.id}",\n`;
|
||||
output += `\t\t\t\tname: "${model.name}",\n`;
|
||||
output += `\t\t\t\tprovider: "${model.provider}",\n`;
|
||||
output += `\t\t\t\treasoning: ${model.reasoning},\n`;
|
||||
output += `\t\t\t\tinput: ${JSON.stringify(model.input)},\n`;
|
||||
output += `\t\t\t\tcost: {\n`;
|
||||
output += `\t\t\t\t\tinput: ${model.cost.input},\n`;
|
||||
output += `\t\t\t\t\toutput: ${model.cost.output},\n`;
|
||||
output += `\t\t\t\t\tcacheRead: ${model.cost.cacheRead},\n`;
|
||||
output += `\t\t\t\t\tcacheWrite: ${model.cost.cacheWrite},\n`;
|
||||
output += `\t\t\t\t},\n`;
|
||||
output += `\t\t\t\tcontextWindow: ${model.contextWindow},\n`;
|
||||
output += `\t\t\t\tmaxTokens: ${model.maxTokens},\n`;
|
||||
output += `\t\t\t} satisfies Model,\n`;
|
||||
}
|
||||
|
||||
// Generate Anthropic models (avoiding duplicates)
|
||||
output += `// Anthropic models - use AnthropicLLM\n`;
|
||||
output += `export const ANTHROPIC_MODELS = {\n`;
|
||||
const seenAnthropicModels = new Set<string>();
|
||||
for (const [providerId, provider] of Object.entries(anthropicModels)) {
|
||||
const p = provider as any;
|
||||
for (const [modelId, model] of Object.entries(p.models || {})) {
|
||||
if (!seenAnthropicModels.has(modelId)) {
|
||||
seenAnthropicModels.add(modelId);
|
||||
const m = model as any;
|
||||
output += ` "${modelId}": ${JSON.stringify(m, null, 8).split('\n').join('\n ')},\n`;
|
||||
}
|
||||
}
|
||||
}
|
||||
output += `} as const;\n\n`;
|
||||
output += `\t\t}\n`;
|
||||
output += `\t},\n`;
|
||||
}
|
||||
|
||||
// Generate Gemini models (avoiding duplicates)
|
||||
output += `// Gemini models - use GeminiLLM\n`;
|
||||
output += `export const GEMINI_MODELS = {\n`;
|
||||
const seenGeminiModels = new Set<string>();
|
||||
for (const [providerId, provider] of Object.entries(geminiModels)) {
|
||||
const p = provider as any;
|
||||
for (const [modelId, model] of Object.entries(p.models || {})) {
|
||||
if (!seenGeminiModels.has(modelId)) {
|
||||
seenGeminiModels.add(modelId);
|
||||
const m = model as any;
|
||||
output += ` "${modelId}": ${JSON.stringify(m, null, 8).split('\n').join('\n ')},\n`;
|
||||
}
|
||||
}
|
||||
}
|
||||
output += `} as const;\n\n`;
|
||||
output += `} as const;
|
||||
|
||||
// Generate type helpers
|
||||
output += `// Type helpers\n`;
|
||||
output += `export type OpenAIModel = keyof typeof OPENAI_MODELS;\n`;
|
||||
output += `export type OpenAICompatibleProvider = keyof typeof OPENAI_COMPATIBLE_PROVIDERS;\n`;
|
||||
output += `export type AnthropicModel = keyof typeof ANTHROPIC_MODELS;\n`;
|
||||
output += `export type GeminiModel = keyof typeof GEMINI_MODELS;\n\n`;
|
||||
|
||||
// Generate the factory function
|
||||
output += `// Factory function implementation\n`;
|
||||
output += `import { OpenAIResponsesLLM } from "./providers/openai-responses.js";\n`;
|
||||
output += `import { OpenAICompletionsLLM } from "./providers/openai-completions.js";\n`;
|
||||
output += `import { AnthropicLLM } from "./providers/anthropic.js";\n`;
|
||||
output += `import { GeminiLLM } from "./providers/gemini.js";\n`;
|
||||
output += `import type { LLM, LLMOptions } from "./types.js";\n\n`;
|
||||
|
||||
output += `export interface CreateLLMOptions {
|
||||
apiKey?: string;
|
||||
baseUrl?: string;
|
||||
}
|
||||
|
||||
// Overloads for type safety
|
||||
export function createLLM(
|
||||
provider: "openai",
|
||||
model: OpenAIModel,
|
||||
options?: CreateLLMOptions
|
||||
): OpenAIResponsesLLM;
|
||||
|
||||
export function createLLM(
|
||||
provider: OpenAICompatibleProvider,
|
||||
model: string, // We'll validate at runtime
|
||||
options?: CreateLLMOptions
|
||||
): OpenAICompletionsLLM;
|
||||
|
||||
export function createLLM(
|
||||
provider: "anthropic",
|
||||
model: AnthropicModel,
|
||||
options?: CreateLLMOptions
|
||||
): AnthropicLLM;
|
||||
|
||||
export function createLLM(
|
||||
provider: "gemini",
|
||||
model: GeminiModel,
|
||||
options?: CreateLLMOptions
|
||||
): GeminiLLM;
|
||||
|
||||
// Implementation
|
||||
export function createLLM(
|
||||
provider: string,
|
||||
model: string,
|
||||
options?: CreateLLMOptions
|
||||
): LLM<LLMOptions> {
|
||||
const apiKey = options?.apiKey || process.env[getEnvVar(provider)];
|
||||
|
||||
if (provider === "openai") {
|
||||
return new OpenAIResponsesLLM(model, apiKey);
|
||||
}
|
||||
|
||||
if (provider === "anthropic") {
|
||||
return new AnthropicLLM(model, apiKey);
|
||||
}
|
||||
|
||||
if (provider === "gemini") {
|
||||
return new GeminiLLM(model, apiKey);
|
||||
}
|
||||
|
||||
// OpenAI-compatible providers
|
||||
if (provider in OPENAI_COMPATIBLE_PROVIDERS) {
|
||||
const providerData = OPENAI_COMPATIBLE_PROVIDERS[provider as OpenAICompatibleProvider];
|
||||
const baseUrl = options?.baseUrl || providerData.baseUrl;
|
||||
return new OpenAICompletionsLLM(model, apiKey, baseUrl);
|
||||
}
|
||||
|
||||
throw new Error(\`Unknown provider: \${provider}\`);
|
||||
}
|
||||
|
||||
// Helper to get the default environment variable for a provider
|
||||
function getEnvVar(provider: string): string {
|
||||
switch (provider) {
|
||||
case "openai": return "OPENAI_API_KEY";
|
||||
case "anthropic": return "ANTHROPIC_API_KEY";
|
||||
case "gemini": return "GEMINI_API_KEY";
|
||||
case "groq": return "GROQ_API_KEY";
|
||||
case "cerebras": return "CEREBRAS_API_KEY";
|
||||
case "together": return "TOGETHER_API_KEY";
|
||||
case "openrouter": return "OPENROUTER_API_KEY";
|
||||
default: return \`\${provider.toUpperCase()}_API_KEY\`;
|
||||
}
|
||||
}
|
||||
// Helper type to extract models for each provider
|
||||
export type ProviderModels = {
|
||||
[K in keyof typeof PROVIDERS]: typeof PROVIDERS[K]["models"]
|
||||
};
|
||||
`;
|
||||
|
||||
// Write the generated file
|
||||
writeFileSync(join(process.cwd(), "src/models.generated.ts"), output);
|
||||
console.log("✅ Generated src/models.generated.ts");
|
||||
// Write file
|
||||
writeFileSync(join(process.cwd(), "src/models.generated.ts"), output);
|
||||
console.log("✅ Generated src/models.generated.ts");
|
||||
|
||||
// Count statistics
|
||||
const openaiCount = Object.values(openaiModels).reduce((acc, p: any) => acc + Object.keys(p.models || {}).length, 0);
|
||||
const compatCount = Object.values(openaiCompatibleProviders).reduce((acc, p: any) => acc + Object.keys(p.models || {}).length, 0);
|
||||
const anthropicCount = Object.values(anthropicModels).reduce((acc, p: any) => acc + Object.keys(p.models || {}).length, 0);
|
||||
const geminiCount = Object.values(geminiModels).reduce((acc, p: any) => acc + Object.keys(p.models || {}).length, 0);
|
||||
// Print statistics
|
||||
const totalModels = allModels.length;
|
||||
const reasoningModels = allModels.filter(m => m.reasoning).length;
|
||||
|
||||
console.log(`\nModel counts:`);
|
||||
console.log(` OpenAI (Responses API): ${openaiCount} models`);
|
||||
console.log(` OpenAI-compatible: ${compatCount} models across ${Object.keys(openaiCompatibleProviders).length} providers`);
|
||||
console.log(` Anthropic: ${anthropicCount} models`);
|
||||
console.log(` Gemini: ${geminiCount} models`);
|
||||
console.log(` Total: ${openaiCount + compatCount + anthropicCount + geminiCount} models`);
|
||||
console.log(`\n📊 Model Statistics:`);
|
||||
console.log(` Total tool-capable models: ${totalModels}`);
|
||||
console.log(` Reasoning-capable models: ${reasoningModels}`);
|
||||
|
||||
for (const [provider, models] of Object.entries(providers)) {
|
||||
console.log(` ${provider}: ${models.length} models`);
|
||||
}
|
||||
}
|
||||
|
||||
// Run the generator
|
||||
generateModels().catch(console.error);
|
||||
|
|
@ -3,41 +3,30 @@
|
|||
|
||||
export const version = "0.5.8";
|
||||
|
||||
// Export generated models and factory
|
||||
// Export generated models data
|
||||
export { PROVIDERS } from "./models.generated.js";
|
||||
|
||||
// Export models utilities and types
|
||||
export {
|
||||
ANTHROPIC_MODELS,
|
||||
type AnthropicModel,
|
||||
type CreateLLMOptions,
|
||||
type CerebrasModel,
|
||||
createLLM,
|
||||
GEMINI_MODELS,
|
||||
type GeminiModel,
|
||||
type ModelData,
|
||||
OPENAI_COMPATIBLE_PROVIDERS,
|
||||
OPENAI_MODELS,
|
||||
type OpenAICompatibleProvider,
|
||||
type GoogleModel,
|
||||
type GroqModel,
|
||||
type Model,
|
||||
type OpenAIModel,
|
||||
type ProviderData,
|
||||
} from "./models.generated.js";
|
||||
// Export models utilities
|
||||
export {
|
||||
getAllProviders,
|
||||
getModelInfo,
|
||||
getProviderInfo,
|
||||
getProviderModels,
|
||||
loadModels,
|
||||
type ModalityInput,
|
||||
type ModalityOutput,
|
||||
type ModelInfo,
|
||||
type ModelsData,
|
||||
type ProviderInfo,
|
||||
supportsThinking,
|
||||
supportsTools,
|
||||
type OpenRouterModel,
|
||||
PROVIDER_CONFIG,
|
||||
type ProviderModels,
|
||||
type ProviderToLLM,
|
||||
type XAIModel,
|
||||
} from "./models.js";
|
||||
|
||||
// Export providers
|
||||
export { AnthropicLLM } from "./providers/anthropic.js";
|
||||
export { GeminiLLM } from "./providers/gemini.js";
|
||||
export { GoogleLLM } from "./providers/gemini.js";
|
||||
export { OpenAICompletionsLLM } from "./providers/openai-completions.js";
|
||||
export { OpenAIResponsesLLM } from "./providers/openai-responses.js";
|
||||
|
||||
// Export types
|
||||
export type * from "./types.js";
|
||||
|
|
|
|||
|
|
@ -1,133 +1,97 @@
|
|||
import { readFileSync } from "fs";
|
||||
import { dirname, join } from "path";
|
||||
import { fileURLToPath } from "url";
|
||||
import { PROVIDERS } from "./models.generated.js";
|
||||
import { AnthropicLLM } from "./providers/anthropic.js";
|
||||
import { GoogleLLM } from "./providers/gemini.js";
|
||||
import { OpenAICompletionsLLM } from "./providers/openai-completions.js";
|
||||
import { OpenAIResponsesLLM } from "./providers/openai-responses.js";
|
||||
import type { Model } from "./types.js";
|
||||
|
||||
export type ModalityInput = "text" | "image" | "audio" | "video" | "pdf";
|
||||
export type ModalityOutput = "text" | "image" | "audio";
|
||||
// Provider configuration with factory functions
|
||||
export const PROVIDER_CONFIG = {
|
||||
google: {
|
||||
envKey: "GEMINI_API_KEY",
|
||||
create: (model: string, apiKey: string) => new GoogleLLM(model, apiKey),
|
||||
},
|
||||
openai: {
|
||||
envKey: "OPENAI_API_KEY",
|
||||
create: (model: string, apiKey: string) => new OpenAIResponsesLLM(model, apiKey),
|
||||
},
|
||||
anthropic: {
|
||||
envKey: "ANTHROPIC_API_KEY",
|
||||
create: (model: string, apiKey: string) => new AnthropicLLM(model, apiKey),
|
||||
},
|
||||
xai: {
|
||||
envKey: "XAI_API_KEY",
|
||||
create: (model: string, apiKey: string) => new OpenAICompletionsLLM(model, apiKey, "https://api.x.ai/v1"),
|
||||
},
|
||||
groq: {
|
||||
envKey: "GROQ_API_KEY",
|
||||
create: (model: string, apiKey: string) =>
|
||||
new OpenAICompletionsLLM(model, apiKey, "https://api.groq.com/openai/v1"),
|
||||
},
|
||||
cerebras: {
|
||||
envKey: "CEREBRAS_API_KEY",
|
||||
create: (model: string, apiKey: string) => new OpenAICompletionsLLM(model, apiKey, "https://api.cerebras.ai/v1"),
|
||||
},
|
||||
openrouter: {
|
||||
envKey: "OPENROUTER_API_KEY",
|
||||
create: (model: string, apiKey: string) =>
|
||||
new OpenAICompletionsLLM(model, apiKey, "https://openrouter.ai/api/v1"),
|
||||
},
|
||||
} as const;
|
||||
|
||||
export interface ModelInfo {
|
||||
id: string;
|
||||
name: string;
|
||||
attachment: boolean;
|
||||
reasoning: boolean;
|
||||
temperature: boolean;
|
||||
tool_call: boolean;
|
||||
release_date: string;
|
||||
last_updated: string;
|
||||
modalities: {
|
||||
input: ModalityInput[];
|
||||
output: ModalityOutput[];
|
||||
};
|
||||
open_weights: boolean;
|
||||
limit: {
|
||||
context: number;
|
||||
output: number;
|
||||
};
|
||||
knowledge?: string; // Optional - knowledge cutoff date
|
||||
cost?: {
|
||||
input: number;
|
||||
output: number;
|
||||
cache_read?: number;
|
||||
cache_write?: number;
|
||||
};
|
||||
// Type mapping from provider to LLM implementation
|
||||
export type ProviderToLLM = {
|
||||
google: GoogleLLM;
|
||||
openai: OpenAIResponsesLLM;
|
||||
anthropic: AnthropicLLM;
|
||||
xai: OpenAICompletionsLLM;
|
||||
groq: OpenAICompletionsLLM;
|
||||
cerebras: OpenAICompletionsLLM;
|
||||
openrouter: OpenAICompletionsLLM;
|
||||
};
|
||||
|
||||
// Extract model types for each provider
|
||||
export type GoogleModel = keyof typeof PROVIDERS.google.models;
|
||||
export type OpenAIModel = keyof typeof PROVIDERS.openai.models;
|
||||
export type AnthropicModel = keyof typeof PROVIDERS.anthropic.models;
|
||||
export type XAIModel = keyof typeof PROVIDERS.xai.models;
|
||||
export type GroqModel = keyof typeof PROVIDERS.groq.models;
|
||||
export type CerebrasModel = keyof typeof PROVIDERS.cerebras.models;
|
||||
export type OpenRouterModel = keyof typeof PROVIDERS.openrouter.models;
|
||||
|
||||
// Map providers to their model types
|
||||
export type ProviderModels = {
|
||||
google: GoogleModel;
|
||||
openai: OpenAIModel;
|
||||
anthropic: AnthropicModel;
|
||||
xai: XAIModel;
|
||||
groq: GroqModel;
|
||||
cerebras: CerebrasModel;
|
||||
openrouter: OpenRouterModel;
|
||||
};
|
||||
|
||||
// Single generic factory function
|
||||
export function createLLM<P extends keyof typeof PROVIDERS, M extends keyof (typeof PROVIDERS)[P]["models"]>(
|
||||
provider: P,
|
||||
model: M,
|
||||
apiKey?: string,
|
||||
): ProviderToLLM[P] {
|
||||
const config = PROVIDER_CONFIG[provider as keyof typeof PROVIDER_CONFIG];
|
||||
if (!config) throw new Error(`Unknown provider: ${provider}`);
|
||||
|
||||
const providerData = PROVIDERS[provider];
|
||||
if (!providerData) throw new Error(`Unknown provider: ${provider}`);
|
||||
|
||||
// Type-safe model lookup
|
||||
const models = providerData.models as Record<string, Model>;
|
||||
const modelData = models[model as string];
|
||||
if (!modelData) throw new Error(`Unknown model: ${String(model)} for provider ${provider}`);
|
||||
|
||||
const key = apiKey || process.env[config.envKey];
|
||||
if (!key) throw new Error(`No API key provided for ${provider}. Set ${config.envKey} or pass apiKey.`);
|
||||
|
||||
return config.create(model as string, key) as ProviderToLLM[P];
|
||||
}
|
||||
|
||||
export interface ProviderInfo {
|
||||
id: string;
|
||||
env?: string[];
|
||||
npm?: string;
|
||||
api?: string;
|
||||
name: string;
|
||||
doc?: string;
|
||||
models: Record<string, ModelInfo>;
|
||||
}
|
||||
|
||||
export type ModelsData = Record<string, ProviderInfo>;
|
||||
|
||||
let cachedModels: ModelsData | null = null;
|
||||
|
||||
/**
|
||||
* Load models data from models.json
|
||||
* The file is loaded relative to this module's location
|
||||
*/
|
||||
export function loadModels(): ModelsData {
|
||||
if (cachedModels) {
|
||||
return cachedModels;
|
||||
}
|
||||
|
||||
try {
|
||||
// Get the directory of this module
|
||||
const currentDir = dirname(fileURLToPath(import.meta.url));
|
||||
const modelsPath = join(currentDir, "models.json");
|
||||
|
||||
const data = readFileSync(modelsPath, "utf-8");
|
||||
cachedModels = JSON.parse(data);
|
||||
return cachedModels!;
|
||||
} catch (error) {
|
||||
console.error("Failed to load models.json:", error);
|
||||
// Return empty providers object as fallback
|
||||
return {};
|
||||
}
|
||||
}
|
||||
|
||||
/**
|
||||
* Get information about a specific model
|
||||
*/
|
||||
export function getModelInfo(modelId: string): ModelInfo | undefined {
|
||||
const data = loadModels();
|
||||
|
||||
// Search through all providers
|
||||
for (const provider of Object.values(data)) {
|
||||
if (provider.models && provider.models[modelId]) {
|
||||
return provider.models[modelId];
|
||||
}
|
||||
}
|
||||
|
||||
return undefined;
|
||||
}
|
||||
|
||||
/**
|
||||
* Get all models for a specific provider
|
||||
*/
|
||||
export function getProviderModels(providerId: string): ModelInfo[] {
|
||||
const data = loadModels();
|
||||
const provider = data[providerId];
|
||||
|
||||
if (!provider || !provider.models) {
|
||||
return [];
|
||||
}
|
||||
|
||||
return Object.values(provider.models);
|
||||
}
|
||||
|
||||
/**
|
||||
* Get provider information
|
||||
*/
|
||||
export function getProviderInfo(providerId: string): ProviderInfo | undefined {
|
||||
const data = loadModels();
|
||||
return data[providerId];
|
||||
}
|
||||
|
||||
/**
|
||||
* Check if a model supports thinking/reasoning
|
||||
*/
|
||||
export function supportsThinking(modelId: string): boolean {
|
||||
const model = getModelInfo(modelId);
|
||||
return model?.reasoning === true;
|
||||
}
|
||||
|
||||
/**
|
||||
* Check if a model supports tool calling
|
||||
*/
|
||||
export function supportsTools(modelId: string): boolean {
|
||||
const model = getModelInfo(modelId);
|
||||
return model?.tool_call === true;
|
||||
}
|
||||
|
||||
/**
|
||||
* Get all available providers
|
||||
*/
|
||||
export function getAllProviders(): ProviderInfo[] {
|
||||
const data = loadModels();
|
||||
return Object.values(data);
|
||||
}
|
||||
// Re-export Model type for convenience
|
||||
export type { Model };
|
||||
|
|
|
|||
|
|
@ -17,7 +17,7 @@ import type {
|
|||
ToolCall,
|
||||
} from "../types.js";
|
||||
|
||||
export interface GeminiLLMOptions extends LLMOptions {
|
||||
export interface GoogleLLMOptions extends LLMOptions {
|
||||
toolChoice?: "auto" | "none" | "any";
|
||||
thinking?: {
|
||||
enabled: boolean;
|
||||
|
|
@ -25,7 +25,7 @@ export interface GeminiLLMOptions extends LLMOptions {
|
|||
};
|
||||
}
|
||||
|
||||
export class GeminiLLM implements LLM<GeminiLLMOptions> {
|
||||
export class GoogleLLM implements LLM<GoogleLLMOptions> {
|
||||
private client: GoogleGenAI;
|
||||
private model: string;
|
||||
|
||||
|
|
@ -42,7 +42,7 @@ export class GeminiLLM implements LLM<GeminiLLMOptions> {
|
|||
this.model = model;
|
||||
}
|
||||
|
||||
async complete(context: Context, options?: GeminiLLMOptions): Promise<AssistantMessage> {
|
||||
async complete(context: Context, options?: GoogleLLMOptions): Promise<AssistantMessage> {
|
||||
try {
|
||||
const contents = this.convertMessages(context.messages);
|
||||
|
||||
|
|
|
|||
|
|
@ -106,3 +106,20 @@ export interface TokenUsage {
|
|||
}
|
||||
|
||||
export type StopReason = "stop" | "length" | "toolUse" | "safety" | "error";
|
||||
|
||||
// Model interface for the unified model system
|
||||
export interface Model {
|
||||
id: string;
|
||||
name: string;
|
||||
provider: string;
|
||||
reasoning: boolean;
|
||||
input: ("text" | "image")[];
|
||||
cost: {
|
||||
input: number; // $/million tokens
|
||||
output: number; // $/million tokens
|
||||
cacheRead: number; // $/million tokens
|
||||
cacheWrite: number; // $/million tokens
|
||||
};
|
||||
contextWindow: number;
|
||||
maxTokens: number;
|
||||
}
|
||||
|
|
|
|||
|
|
@ -1,10 +1,11 @@
|
|||
import { describe, it, beforeAll, afterAll, expect } from "vitest";
|
||||
import { GeminiLLM } from "../src/providers/gemini.js";
|
||||
import { GoogleLLM } from "../src/providers/gemini.js";
|
||||
import { OpenAICompletionsLLM } from "../src/providers/openai-completions.js";
|
||||
import { OpenAIResponsesLLM } from "../src/providers/openai-responses.js";
|
||||
import { AnthropicLLM } from "../src/providers/anthropic.js";
|
||||
import type { LLM, LLMOptions, Context, Tool, AssistantMessage } from "../src/types.js";
|
||||
import { spawn, ChildProcess, execSync } from "child_process";
|
||||
import { createLLM } from "../src/models.js";
|
||||
|
||||
// Calculator tool definition (same as examples)
|
||||
const calculatorTool: Tool = {
|
||||
|
|
@ -213,10 +214,10 @@ async function multiTurn<T extends LLMOptions>(llm: LLM<T>, thinkingOptions: T)
|
|||
|
||||
describe("AI Providers E2E Tests", () => {
|
||||
describe.skipIf(!process.env.GEMINI_API_KEY)("Gemini Provider", () => {
|
||||
let llm: GeminiLLM;
|
||||
let llm: GoogleLLM;
|
||||
|
||||
beforeAll(() => {
|
||||
llm = new GeminiLLM("gemini-2.5-flash", process.env.GEMINI_API_KEY!);
|
||||
llm = new GoogleLLM("gemini-2.5-flash", process.env.GEMINI_API_KEY!);
|
||||
});
|
||||
|
||||
it("should complete basic text generation", async () => {
|
||||
|
|
@ -316,11 +317,11 @@ describe("AI Providers E2E Tests", () => {
|
|||
});
|
||||
});
|
||||
|
||||
describe.skipIf(!process.env.GROK_API_KEY)("Grok Provider (via OpenAI Completions)", () => {
|
||||
describe.skipIf(!process.env.XAI_API_KEY)("xAI Provider (via OpenAI Completions)", () => {
|
||||
let llm: OpenAICompletionsLLM;
|
||||
|
||||
beforeAll(() => {
|
||||
llm = new OpenAICompletionsLLM("grok-code-fast-1", process.env.GROK_API_KEY!, "https://api.x.ai/v1");
|
||||
llm = new OpenAICompletionsLLM("grok-code-fast-1", process.env.XAI_API_KEY!, "https://api.x.ai/v1");
|
||||
});
|
||||
|
||||
it("should complete basic text generation", async () => {
|
||||
|
|
@ -509,4 +510,32 @@ describe("AI Providers E2E Tests", () => {
|
|||
await multiTurn(llm, {reasoningEffort: "medium"});
|
||||
});
|
||||
});
|
||||
|
||||
describe.skipIf(!process.env.OPENROUTER_API_KEY)("OpenRouter Provider (Kimi K2)", () => {
|
||||
let llm: OpenAICompletionsLLM;
|
||||
|
||||
beforeAll(() => {
|
||||
llm = createLLM("openrouter", "moonshotai/kimi-k2", process.env.OPENROUTER_API_KEY!);
|
||||
});
|
||||
|
||||
it("should complete basic text generation", async () => {
|
||||
await basicTextGeneration(llm);
|
||||
});
|
||||
|
||||
it("should handle tool calling", async () => {
|
||||
await handleToolCall(llm);
|
||||
});
|
||||
|
||||
it("should handle streaming", async () => {
|
||||
await handleStreaming(llm);
|
||||
});
|
||||
|
||||
it("should handle thinking mode", async () => {
|
||||
await handleThinking(llm, {reasoningEffort: "medium"}, false);
|
||||
});
|
||||
|
||||
it("should handle multi-turn with thinking and tools", async () => {
|
||||
await multiTurn(llm, {reasoningEffort: "medium"});
|
||||
});
|
||||
});
|
||||
});
|
||||
Loading…
Add table
Add a link
Reference in a new issue