co-mono/packages/ai/test/image-limits.test.ts
Mario Zechner 19f3c23f6d Fix PR #689: Add changelog attribution, coding-agent changelog, fix test types, add provider to test suites
- Fix ai/CHANGELOG.md: add PR link and author attribution
- Add coding-agent/CHANGELOG.md entry for vercel-ai-gateway provider
- Fix model-resolver.test.ts: use anthropic-messages API type to match generated models
- Add vercel-ai-gateway to test suites: tokens, abort, empty, context-overflow, unicode-surrogate, tool-call-without-result, image-tool-result, total-tokens, image-limits
2026-01-13 16:46:00 +01:00

1269 lines
44 KiB
TypeScript

/**
* Image limits test suite
*
* Tests provider-specific image limitations:
* - Maximum number of images in a context (with small 100x100 images)
* - Maximum image size (bytes)
* - Maximum image dimensions
* - Maximum payload (realistic large images stress test)
*
* ============================================================================
* DISCOVERED LIMITS (Dec 2025):
* ============================================================================
*
* BASIC LIMITS (small images):
* | Provider | Model | Max Images | Max Size | Max Dim |
* |-------------|--------------------|------------|----------|----------|
* | Anthropic | claude-3-5-haiku | 100 | 5MB | 8000px |
* | OpenAI | gpt-4o-mini | 500 | ≥25MB | ≥20000px |
* | Gemini | gemini-2.5-flash | ~2000* | ≥40MB | 8000px |
* | Mistral | pixtral-12b | 8 | ~15MB | 8000px |
* | xAI | grok-2-vision | ≥100 | 25MB | 8000px |
* | Groq | llama-4-scout-17b | 5 | ~5MB | ~5760px**|
* | zAI | glm-4.5v | *** | ≥20MB | 8000px |
* | OpenRouter | z-ai/glm-4.5v | *** | ~10MB | ≥20000px |
*
* REALISTIC PAYLOAD LIMITS (large images):
* | Provider | Image Size | Max Count | Total Payload | Limit Hit |
* |-------------|------------|-----------|---------------|---------------------|
* | Anthropic | ~3MB | 6 | ~18MB | Request too large |
* | OpenAI | ~15MB | 2 | ~30MB | Generic error |
* | Gemini | ~20MB | 10 | ~200MB | String length |
* | Mistral | ~10MB | 4 | ~40MB | 413 Payload too large|
* | xAI | ~20MB | 1 | ~20MB | 413 Entity too large|
* | Groq | 5760px | 5 | N/A | 5 image limit |
* | zAI | ~15MB | 2 | ~30MB | 50MB request limit |
* | OpenRouter | ~5MB | 2 | ~10MB | Provider error |
*
* Notes:
* - Anthropic: 100 image hard limit, 5MB per image, but ~18MB total request
* limit in practice (32MB documented but hit limit at ~24MB).
* - OpenAI: 500 image limit but total payload limited to ~30-45MB.
* - Gemini: * Very permissive. 10 x 20MB = 200MB worked!
* - Mistral: 8 images max, ~40MB total payload.
* - xAI: 25MB per image but strict request size limit (~20MB total).
* - Groq: ** Most restrictive. 5 images max, 33177600 pixels max (≈5760x5760).
* - zAI: 50MB request limit (explicit in error message).
* - OpenRouter: *** Context-window limited (65536 tokens).
*
* ============================================================================
* PRACTICAL RECOMMENDATIONS FOR CODING AGENTS:
* ============================================================================
*
* Conservative cross-provider safe limits:
* - Max 2 images per request at ~5MB each (~10MB total)
* - Max 5760px dimension (for Groq pixel limit)
*
* If excluding Groq:
* - Max 4 images per request at ~5MB each (~20MB total)
* - Max 8000px dimension
*
* For Anthropic-only (most common case):
* - Max 6 images at ~3MB each OR 100 images at <200KB each
* - Max 5MB per image
* - Max 8000px dimension
* - Stay under ~18MB total request size
*
* ============================================================================
*/
import { execSync } from "node:child_process";
import { mkdirSync, readFileSync, rmSync, statSync } from "node:fs";
import { dirname, join } from "node:path";
import { fileURLToPath } from "node:url";
import { afterAll, beforeAll, describe, expect, it } from "vitest";
import { getModel } from "../src/models.js";
import { complete } from "../src/stream.js";
import type { Api, Context, ImageContent, Model, OptionsForApi, UserMessage } from "../src/types.js";
import { hasBedrockCredentials } from "./bedrock-utils.js";
// Derive this file's absolute path and its containing directory from import.meta.url.
const __filename = fileURLToPath(import.meta.url);
const __dirname = dirname(__filename);
// Temp directory for generated images; it sits next to this test file.
const TEMP_DIR = join(__dirname, ".temp-images");
/**
 * Render a solid red image of the given dimensions with ImageMagick and
 * return the resulting file base64-encoded.
 *
 * The output format is whatever ImageMagick derives from `filename`
 * (callers in this file pass `.png` names).
 *
 * @param width - Image width in pixels.
 * @param height - Image height in pixels.
 * @param filename - Name of the file to create inside TEMP_DIR; the directory must already exist.
 * @returns The generated file's bytes as a base64 string.
 * @throws If the `magick` command fails or the output file cannot be read.
 */
function generateImage(width: number, height: number, filename: string): string {
	const filepath = join(TEMP_DIR, filename);
	execSync(`magick -size ${width}x${height} xc:red "${filepath}"`, { stdio: "ignore" });
	// Use the ESM import rather than `require("fs")`: this file is an ES module
	// (it relies on import.meta.url), where a global `require` is not guaranteed to exist.
	return readFileSync(filepath).toString("base64");
}
/**
 * Generate a random-noise PNG whose file size is approximately `targetBytes`
 * and return it base64-encoded.
 *
 * The first render sizes a square image at 3 bytes per pixel (8-bit RGB). If the
 * file comes out smaller than 80% of the target, the image is rendered once more
 * with its side scaled by sqrt(target / actual). No further correction is made,
 * so the final size is only approximate (and may exceed the target).
 *
 * @param targetBytes - Desired file size in bytes.
 * @param filename - Name of the file to create inside TEMP_DIR; the directory must already exist.
 * @returns The generated file's bytes as a base64 string.
 * @throws If the `magick` command fails or the output file cannot be inspected/read.
 */
function generateImageWithSize(targetBytes: number, filename: string): string {
	const filepath = join(TEMP_DIR, filename);

	// A noise pattern keeps PNG compression from shrinking the file well below its raw pixel size.
	const renderNoise = (side: number): void => {
		execSync(`magick -size ${side}x${side} xc: +noise Random -depth 8 PNG24:"${filepath}"`, { stdio: "ignore" });
	};

	// For a square RGB image: side = sqrt(targetBytes / 3).
	const side = Math.ceil(Math.sqrt(targetBytes / 3));
	renderNoise(side);

	// Use the ESM imports rather than `require("fs")`: this file is an ES module
	// (it relies on import.meta.url), where a global `require` is not guaranteed to exist.
	const actualBytes = statSync(filepath).size;
	if (actualBytes < targetBytes * 0.8) {
		// Too small: grow the side proportionally to the shortfall and render once more.
		renderNoise(Math.ceil(side * Math.sqrt(targetBytes / actualBytes)));
	}

	return readFileSync(filepath).toString("base64");
}
/**
 * Build one user message made of a text instruction followed by `imageCount`
 * copies of the same base64-encoded PNG.
 *
 * @param imageCount - How many image parts to append after the text part.
 * @param imageBase64 - Base64 image data reused for every image part.
 * @returns A user message stamped with the current time.
 */
function createMultiImageMessage(imageCount: number, imageBase64: string): UserMessage {
	const parts: (ImageContent | { type: "text"; text: string })[] = [];
	parts.push({
		type: "text",
		text: `I am sending you ${imageCount} images. Just reply with "received ${imageCount}".`,
	});

	// Count down instead of up; each iteration appends a fresh image part.
	let remaining = imageCount;
	while (remaining > 0) {
		parts.push({ type: "image", data: imageBase64, mimeType: "image/png" });
		remaining -= 1;
	}

	return { role: "user", content: parts, timestamp: Date.now() };
}
/**
 * Send `imageCount` copies of one image to `model` in a single request and
 * report whether the request was accepted.
 *
 * Never throws for request failures: both an "error" stop reason and an
 * exception raised by `complete` are folded into `{ success: false, error }`.
 *
 * @param model - Model to send the request to.
 * @param imageCount - Number of image parts in the message.
 * @param imageBase64 - Base64 image data used for every part.
 * @param options - Optional provider options forwarded to `complete`.
 */
async function testImageCount<TApi extends Api>(
	model: Model<TApi>,
	imageCount: number,
	imageBase64: string,
	options?: OptionsForApi<TApi>,
): Promise<{ success: boolean; error?: string }> {
	const userMessage = createMultiImageMessage(imageCount, imageBase64);
	const context: Context = { messages: [userMessage] };

	try {
		const reply = await complete(model, context, options);
		return reply.stopReason === "error" ? { success: false, error: reply.errorMessage } : { success: true };
	} catch (cause) {
		const error = cause instanceof Error ? cause.message : String(cause);
		return { success: false, error };
	}
}
/**
 * Send a single image to `model` and report whether the request was accepted.
 * Used by the byte-size probes; the image is passed through unchanged.
 *
 * Never throws for request failures: both an "error" stop reason and an
 * exception raised by `complete` are folded into `{ success: false, error }`.
 *
 * @param model - Model to send the request to.
 * @param imageBase64 - Base64 image data, sent as image/png.
 * @param options - Optional provider options forwarded to `complete`.
 */
async function testImageSize<TApi extends Api>(
	model: Model<TApi>,
	imageBase64: string,
	options?: OptionsForApi<TApi>,
): Promise<{ success: boolean; error?: string }> {
	const prompt = { type: "text" as const, text: "I am sending you an image. Just reply with 'received'." };
	const image = { type: "image" as const, data: imageBase64, mimeType: "image/png" };
	const context: Context = {
		messages: [{ role: "user", content: [prompt, image], timestamp: Date.now() }],
	};

	try {
		const reply = await complete(model, context, options);
		return reply.stopReason === "error" ? { success: false, error: reply.errorMessage } : { success: true };
	} catch (cause) {
		const error = cause instanceof Error ? cause.message : String(cause);
		return { success: false, error };
	}
}
/**
 * Send a single image to `model` and report whether the request was accepted.
 * Used by the pixel-dimension probes; the request has the same shape as the
 * one built for the byte-size probes.
 *
 * Request failures are returned, not thrown: an "error" stop reason or an
 * exception from `complete` yields `{ success: false, error }`.
 *
 * @param model - Model to send the request to.
 * @param imageBase64 - Base64 image data, sent as image/png.
 * @param options - Optional provider options forwarded to `complete`.
 */
async function testImageDimensions<TApi extends Api>(
	model: Model<TApi>,
	imageBase64: string,
	options?: OptionsForApi<TApi>,
): Promise<{ success: boolean; error?: string }> {
	const context: Context = {
		messages: [
			{
				role: "user",
				timestamp: Date.now(),
				content: [
					{ type: "text", text: "I am sending you an image. Just reply with 'received'." },
					{ type: "image", data: imageBase64, mimeType: "image/png" },
				],
			},
		],
	};

	let failure: string | undefined;
	try {
		const reply = await complete(model, context, options);
		if (reply.stopReason !== "error") {
			return { success: true };
		}
		failure = reply.errorMessage;
	} catch (cause) {
		failure = cause instanceof Error ? cause.message : String(cause);
	}
	return { success: false, error: failure };
}
/**
 * Find the largest probed value that succeeds, using a linear search.
 *
 * Probes `min`, `min + step`, ... up to and including `max`, one at a time, and
 * stops at the first failure.
 *
 * @param testFn - Probe to run for a candidate value; resolves with the outcome.
 * @param min - First value to probe.
 * @param max - Largest value that may be probed (inclusive).
 * @param step - Increment between probes; must be greater than zero.
 * @returns `limit` is the last value that succeeded, or 0 when no probe succeeded
 *   (the same "nothing passed" sentinel the inline size/dimension loops in this file use).
 *   `lastError` is the error of the failing probe, if any.
 * @throws RangeError (as a rejected promise) when `step` is not a positive number,
 *   since the loop would otherwise never advance.
 */
async function findLimit(
	testFn: (value: number) => Promise<{ success: boolean; error?: string }>,
	min: number,
	max: number,
	step: number,
): Promise<{ limit: number; lastError?: string }> {
	if (!(step > 0)) {
		throw new RangeError(`findLimit: step must be a positive number, got ${step}`);
	}
	// Start at 0 rather than `min`: `min` has not been shown to work until its probe passes.
	let lastSuccess = 0;
	let lastError: string | undefined;
	for (let value = min; value <= max; value += step) {
		console.log(` Testing value: ${value}...`);
		const result = await testFn(value);
		if (!result.success) {
			lastError = result.error;
			// Provider errors can be very long; log only the first 100 characters.
			console.log(` FAILED: ${result.error?.substring(0, 100)}`);
			break;
		}
		lastSuccess = value;
		console.log(` SUCCESS`);
	}
	return { limit: lastSuccess, lastError };
}
// =============================================================================
// Provider-specific test suites
// =============================================================================
describe("Image Limits E2E Tests", () => {
// Base64-encoded 100x100 image shared by the image-count tests; assigned in beforeAll.
let smallImage: string;

beforeAll(() => {
	// The scratch directory has to exist before the first image is written into it.
	mkdirSync(TEMP_DIR, { recursive: true });
	smallImage = generateImage(100, 100, "small.png");
});

afterAll(() => {
	// Remove the scratch directory together with every image generated during the run.
	rmSync(TEMP_DIR, { force: true, recursive: true });
});
// -------------------------------------------------------------------------
// Anthropic (claude-3-5-haiku-20241022)
// Known limits: 100 images, 5MB per image, 8000px max dimension
// Skipped unless ANTHROPIC_API_KEY is set.
// -------------------------------------------------------------------------
describe.skipIf(!process.env.ANTHROPIC_API_KEY)("Anthropic (claude-3-5-haiku-20241022)", () => {
	const model = getModel("anthropic", "claude-3-5-haiku-20241022");
	// Each limit probe issues several requests in sequence, so it gets a long timeout.
	const TEN_MINUTES = 10 * 60 * 1000;

	it("should accept a small number of images (5)", async () => {
		const { success, error } = await testImageCount(model, 5, smallImage);
		expect(success, error).toBe(true);
	});

	it("should find maximum image count limit", { timeout: TEN_MINUTES }, async () => {
		// Known limit is 100 images: probing 20, 40, ... 120 should last succeed at 80 or 100.
		const sendImages = (count: number) => testImageCount(model, count, smallImage);
		const probe = await findLimit(sendImages, 20, 120, 20);
		console.log(`\n Anthropic max images: ~${probe.limit} (last error: ${probe.lastError})`);
		expect(probe.limit).toBeGreaterThanOrEqual(80);
		expect(probe.limit).toBeLessThanOrEqual(100);
	});

	it("should find maximum image size limit", { timeout: TEN_MINUTES }, async () => {
		// Known limit is 5MB per image: walk 1MB..6MB and stop at the first rejection.
		const bytesPerMB = 1024 * 1024;
		let largestAccepted = 0;
		let rejection: string | undefined;
		for (const megabytes of [1, 2, 3, 4, 5, 6]) {
			console.log(` Testing size: ${megabytes}MB...`);
			const payload = generateImageWithSize(megabytes * bytesPerMB, `size-${megabytes}mb.png`);
			const outcome = await testImageSize(model, payload);
			if (!outcome.success) {
				rejection = outcome.error;
				console.log(` FAILED: ${outcome.error?.substring(0, 100)}`);
				break;
			}
			largestAccepted = megabytes;
			console.log(` SUCCESS`);
		}
		console.log(`\n Anthropic max image size: ~${largestAccepted}MB (last error: ${rejection})`);
		expect(largestAccepted).toBeGreaterThanOrEqual(1);
	});

	it("should find maximum image dimension limit", { timeout: TEN_MINUTES }, async () => {
		// Known limit is 8000px: the largest accepted square should be 6000px or 8000px.
		let largestAccepted = 0;
		let rejection: string | undefined;
		for (const side of [1000, 2000, 4000, 6000, 8000, 10000]) {
			console.log(` Testing dimension: ${side}x${side}...`);
			const payload = generateImage(side, side, `dim-${side}.png`);
			const outcome = await testImageDimensions(model, payload);
			if (!outcome.success) {
				rejection = outcome.error;
				console.log(` FAILED: ${outcome.error?.substring(0, 100)}`);
				break;
			}
			largestAccepted = side;
			console.log(` SUCCESS`);
		}
		console.log(`\n Anthropic max dimension: ~${largestAccepted}px (last error: ${rejection})`);
		expect(largestAccepted).toBeGreaterThanOrEqual(6000);
		expect(largestAccepted).toBeLessThanOrEqual(8000);
	});
});
// -------------------------------------------------------------------------
// OpenAI (gpt-4o-mini via openai-completions)
// Known limits: 500 images, ~20MB per image (documented)
// Skipped unless OPENAI_API_KEY is set.
// -------------------------------------------------------------------------
describe.skipIf(!process.env.OPENAI_API_KEY)("OpenAI (gpt-4o-mini)", () => {
	// Take the registered gpt-4o-mini model and override its api field to "openai-completions".
	const model: Model<"openai-completions"> = { ...getModel("openai", "gpt-4o-mini"), api: "openai-completions" };
	// Each limit probe issues several requests in sequence, so it gets a long timeout.
	const TEN_MINUTES = 10 * 60 * 1000;

	it("should accept a small number of images (5)", async () => {
		const { success, error } = await testImageCount(model, 5, smallImage);
		expect(success, error).toBe(true);
	});

	it("should find maximum image count limit", { timeout: TEN_MINUTES }, async () => {
		// Known limit is 500 images: probing 100, 200, ... 600 should last succeed at 400 or 500.
		const sendImages = (count: number) => testImageCount(model, count, smallImage);
		const probe = await findLimit(sendImages, 100, 600, 100);
		console.log(`\n OpenAI max images: ~${probe.limit} (last error: ${probe.lastError})`);
		expect(probe.limit).toBeGreaterThanOrEqual(400);
		expect(probe.limit).toBeLessThanOrEqual(500);
	});

	it("should find maximum image size limit", { timeout: TEN_MINUTES }, async () => {
		// Documented limit is 20MB: walk 5MB..25MB and stop at the first rejection.
		const bytesPerMB = 1024 * 1024;
		let largestAccepted = 0;
		let rejection: string | undefined;
		for (const megabytes of [5, 10, 15, 20, 25]) {
			console.log(` Testing size: ${megabytes}MB...`);
			const payload = generateImageWithSize(megabytes * bytesPerMB, `size-${megabytes}mb.png`);
			const outcome = await testImageSize(model, payload);
			if (!outcome.success) {
				rejection = outcome.error;
				console.log(` FAILED: ${outcome.error?.substring(0, 100)}`);
				break;
			}
			largestAccepted = megabytes;
			console.log(` SUCCESS`);
		}
		console.log(`\n OpenAI max image size: ~${largestAccepted}MB (last error: ${rejection})`);
		expect(largestAccepted).toBeGreaterThanOrEqual(15);
	});

	it("should find maximum image dimension limit", { timeout: TEN_MINUTES }, async () => {
		// Walk square images of growing side length and stop at the first rejection.
		let largestAccepted = 0;
		let rejection: string | undefined;
		for (const side of [2000, 4000, 8000, 16000, 20000]) {
			console.log(` Testing dimension: ${side}x${side}...`);
			const payload = generateImage(side, side, `dim-${side}.png`);
			const outcome = await testImageDimensions(model, payload);
			if (!outcome.success) {
				rejection = outcome.error;
				console.log(` FAILED: ${outcome.error?.substring(0, 100)}`);
				break;
			}
			largestAccepted = side;
			console.log(` SUCCESS`);
		}
		console.log(`\n OpenAI max dimension: ~${largestAccepted}px (last error: ${rejection})`);
		expect(largestAccepted).toBeGreaterThanOrEqual(2000);
	});
});
// -------------------------------------------------------------------------
// Google Gemini (gemini-2.5-flash)
// Known limits: very high image count (~2500), large size support
// Skipped unless GEMINI_API_KEY is set.
// -------------------------------------------------------------------------
describe.skipIf(!process.env.GEMINI_API_KEY)("Gemini (gemini-2.5-flash)", () => {
	const model = getModel("google", "gemini-2.5-flash");
	// Each limit probe issues several requests in sequence, so it gets a long timeout.
	const TEN_MINUTES = 10 * 60 * 1000;
	// The image-count probe sends thousands of images and is given extra time.
	const FIFTEEN_MINUTES = 15 * 60 * 1000;

	it("should accept a small number of images (5)", async () => {
		const { success, error } = await testImageCount(model, 5, smallImage);
		expect(success, error).toBe(true);
	});

	it("should find maximum image count limit", { timeout: FIFTEEN_MINUTES }, async () => {
		// Noted to work up to ~2500 images and to hit errors around 3000.
		const sendImages = (count: number) => testImageCount(model, count, smallImage);
		const probe = await findLimit(sendImages, 500, 3000, 500);
		console.log(`\n Gemini max images: ~${probe.limit} (last error: ${probe.lastError})`);
		expect(probe.limit).toBeGreaterThanOrEqual(500);
	});

	it("should find maximum image size limit", { timeout: TEN_MINUTES }, async () => {
		// Noted as very permissive (up to 60MB reported to work); this probe stops at 40MB.
		const bytesPerMB = 1024 * 1024;
		let largestAccepted = 0;
		let rejection: string | undefined;
		for (const megabytes of [10, 20, 30, 40]) {
			console.log(` Testing size: ${megabytes}MB...`);
			const payload = generateImageWithSize(megabytes * bytesPerMB, `size-${megabytes}mb.png`);
			const outcome = await testImageSize(model, payload);
			if (!outcome.success) {
				rejection = outcome.error;
				console.log(` FAILED: ${outcome.error?.substring(0, 100)}`);
				break;
			}
			largestAccepted = megabytes;
			console.log(` SUCCESS`);
		}
		console.log(`\n Gemini max image size: ~${largestAccepted}MB (last error: ${rejection})`);
		expect(largestAccepted).toBeGreaterThanOrEqual(20);
	});

	it("should find maximum image dimension limit", { timeout: TEN_MINUTES }, async () => {
		// Walk square images of growing side length and stop at the first rejection.
		let largestAccepted = 0;
		let rejection: string | undefined;
		for (const side of [2000, 4000, 8000, 16000, 20000]) {
			console.log(` Testing dimension: ${side}x${side}...`);
			const payload = generateImage(side, side, `dim-${side}.png`);
			const outcome = await testImageDimensions(model, payload);
			if (!outcome.success) {
				rejection = outcome.error;
				console.log(` FAILED: ${outcome.error?.substring(0, 100)}`);
				break;
			}
			largestAccepted = side;
			console.log(` SUCCESS`);
		}
		console.log(`\n Gemini max dimension: ~${largestAccepted}px (last error: ${rejection})`);
		expect(largestAccepted).toBeGreaterThanOrEqual(2000);
	});
});
// -------------------------------------------------------------------------
// Mistral (pixtral-12b)
// Known limits: ~8 images, ~15MB per image
// Skipped unless MISTRAL_API_KEY is set.
// -------------------------------------------------------------------------
describe.skipIf(!process.env.MISTRAL_API_KEY)("Mistral (pixtral-12b)", () => {
	const model = getModel("mistral", "pixtral-12b");
	// Each limit probe issues several requests in sequence, so it gets a long timeout.
	const TEN_MINUTES = 10 * 60 * 1000;

	it("should accept a small number of images (5)", async () => {
		const { success, error } = await testImageCount(model, 5, smallImage);
		expect(success, error).toBe(true);
	});

	it("should find maximum image count limit", { timeout: TEN_MINUTES }, async () => {
		// Noted to fail around 9 images, so probe one image at a time from 5 to 15.
		const sendImages = (count: number) => testImageCount(model, count, smallImage);
		const probe = await findLimit(sendImages, 5, 15, 1);
		console.log(`\n Mistral max images: ~${probe.limit} (last error: ${probe.lastError})`);
		expect(probe.limit).toBeGreaterThanOrEqual(5);
	});

	it("should find maximum image size limit", { timeout: TEN_MINUTES }, async () => {
		// Walk 5MB..20MB and stop at the first rejection.
		const bytesPerMB = 1024 * 1024;
		let largestAccepted = 0;
		let rejection: string | undefined;
		for (const megabytes of [5, 10, 15, 20]) {
			console.log(` Testing size: ${megabytes}MB...`);
			const payload = generateImageWithSize(megabytes * bytesPerMB, `size-${megabytes}mb.png`);
			const outcome = await testImageSize(model, payload);
			if (!outcome.success) {
				rejection = outcome.error;
				console.log(` FAILED: ${outcome.error?.substring(0, 100)}`);
				break;
			}
			largestAccepted = megabytes;
			console.log(` SUCCESS`);
		}
		console.log(`\n Mistral max image size: ~${largestAccepted}MB (last error: ${rejection})`);
		expect(largestAccepted).toBeGreaterThanOrEqual(5);
	});

	it("should find maximum image dimension limit", { timeout: TEN_MINUTES }, async () => {
		// Walk square images of growing side length and stop at the first rejection.
		let largestAccepted = 0;
		let rejection: string | undefined;
		for (const side of [2000, 4000, 8000, 16000, 20000]) {
			console.log(` Testing dimension: ${side}x${side}...`);
			const payload = generateImage(side, side, `dim-${side}.png`);
			const outcome = await testImageDimensions(model, payload);
			if (!outcome.success) {
				rejection = outcome.error;
				console.log(` FAILED: ${outcome.error?.substring(0, 100)}`);
				break;
			}
			largestAccepted = side;
			console.log(` SUCCESS`);
		}
		console.log(`\n Mistral max dimension: ~${largestAccepted}px (last error: ${rejection})`);
		expect(largestAccepted).toBeGreaterThanOrEqual(2000);
	});
});
// -------------------------------------------------------------------------
// OpenRouter (z-ai/glm-4.5v)
// Known limits: context-window limited (~45 images at 100x100), ~15MB per image
// Skipped unless OPENROUTER_API_KEY is set.
// -------------------------------------------------------------------------
describe.skipIf(!process.env.OPENROUTER_API_KEY)("OpenRouter (z-ai/glm-4.5v)", () => {
	const model = getModel("openrouter", "z-ai/glm-4.5v");
	// Each limit probe issues several requests in sequence, so it gets a long timeout.
	const TEN_MINUTES = 10 * 60 * 1000;

	it("should accept a small number of images (5)", async () => {
		const { success, error } = await testImageCount(model, 5, smallImage);
		expect(success, error).toBe(true);
	});

	it("should find maximum image count limit", { timeout: TEN_MINUTES }, async () => {
		// The cap comes from the context window rather than an explicit image-count limit.
		const sendImages = (count: number) => testImageCount(model, count, smallImage);
		const probe = await findLimit(sendImages, 10, 60, 10);
		console.log(`\n OpenRouter max images: ~${probe.limit} (last error: ${probe.lastError})`);
		expect(probe.limit).toBeGreaterThanOrEqual(10);
	});

	it("should find maximum image size limit", { timeout: TEN_MINUTES }, async () => {
		// Walk 5MB..20MB and stop at the first rejection.
		const bytesPerMB = 1024 * 1024;
		let largestAccepted = 0;
		let rejection: string | undefined;
		for (const megabytes of [5, 10, 15, 20]) {
			console.log(` Testing size: ${megabytes}MB...`);
			const payload = generateImageWithSize(megabytes * bytesPerMB, `size-${megabytes}mb.png`);
			const outcome = await testImageSize(model, payload);
			if (!outcome.success) {
				rejection = outcome.error;
				console.log(` FAILED: ${outcome.error?.substring(0, 100)}`);
				break;
			}
			largestAccepted = megabytes;
			console.log(` SUCCESS`);
		}
		console.log(`\n OpenRouter max image size: ~${largestAccepted}MB (last error: ${rejection})`);
		expect(largestAccepted).toBeGreaterThanOrEqual(5);
	});

	it("should find maximum image dimension limit", { timeout: TEN_MINUTES }, async () => {
		// Walk square images of growing side length and stop at the first rejection.
		let largestAccepted = 0;
		let rejection: string | undefined;
		for (const side of [2000, 4000, 8000, 16000, 20000]) {
			console.log(` Testing dimension: ${side}x${side}...`);
			const payload = generateImage(side, side, `dim-${side}.png`);
			const outcome = await testImageDimensions(model, payload);
			if (!outcome.success) {
				rejection = outcome.error;
				console.log(` FAILED: ${outcome.error?.substring(0, 100)}`);
				break;
			}
			largestAccepted = side;
			console.log(` SUCCESS`);
		}
		console.log(`\n OpenRouter max dimension: ~${largestAccepted}px (last error: ${rejection})`);
		expect(largestAccepted).toBeGreaterThanOrEqual(2000);
	});
});
// -------------------------------------------------------------------------
// xAI (grok-2-vision)
// Skipped unless XAI_API_KEY is set.
// -------------------------------------------------------------------------
describe.skipIf(!process.env.XAI_API_KEY)("xAI (grok-2-vision)", () => {
	const model = getModel("xai", "grok-2-vision");
	// Each limit probe issues several requests in sequence, so it gets a long timeout.
	const TEN_MINUTES = 10 * 60 * 1000;

	it("should accept a small number of images (5)", async () => {
		const { success, error } = await testImageCount(model, 5, smallImage);
		expect(success, error).toBe(true);
	});

	it("should find maximum image count limit", { timeout: TEN_MINUTES }, async () => {
		// Probe 10, 20, ... 100 images and stop at the first rejection.
		const sendImages = (count: number) => testImageCount(model, count, smallImage);
		const probe = await findLimit(sendImages, 10, 100, 10);
		console.log(`\n xAI max images: ~${probe.limit} (last error: ${probe.lastError})`);
		expect(probe.limit).toBeGreaterThanOrEqual(5);
	});

	it("should find maximum image size limit", { timeout: TEN_MINUTES }, async () => {
		// Walk 5MB..25MB and stop at the first rejection.
		const bytesPerMB = 1024 * 1024;
		let largestAccepted = 0;
		let rejection: string | undefined;
		for (const megabytes of [5, 10, 15, 20, 25]) {
			console.log(` Testing size: ${megabytes}MB...`);
			const payload = generateImageWithSize(megabytes * bytesPerMB, `size-${megabytes}mb.png`);
			const outcome = await testImageSize(model, payload);
			if (!outcome.success) {
				rejection = outcome.error;
				console.log(` FAILED: ${outcome.error?.substring(0, 100)}`);
				break;
			}
			largestAccepted = megabytes;
			console.log(` SUCCESS`);
		}
		console.log(`\n xAI max image size: ~${largestAccepted}MB (last error: ${rejection})`);
		expect(largestAccepted).toBeGreaterThanOrEqual(5);
	});

	it("should find maximum image dimension limit", { timeout: TEN_MINUTES }, async () => {
		// Walk square images of growing side length and stop at the first rejection.
		let largestAccepted = 0;
		let rejection: string | undefined;
		for (const side of [2000, 4000, 8000, 16000, 20000]) {
			console.log(` Testing dimension: ${side}x${side}...`);
			const payload = generateImage(side, side, `dim-${side}.png`);
			const outcome = await testImageDimensions(model, payload);
			if (!outcome.success) {
				rejection = outcome.error;
				console.log(` FAILED: ${outcome.error?.substring(0, 100)}`);
				break;
			}
			largestAccepted = side;
			console.log(` SUCCESS`);
		}
		console.log(`\n xAI max dimension: ~${largestAccepted}px (last error: ${rejection})`);
		expect(largestAccepted).toBeGreaterThanOrEqual(2000);
	});
});
// -------------------------------------------------------------------------
// Groq (llama-4-scout-17b)
// Skipped unless GROQ_API_KEY is set.
// -------------------------------------------------------------------------
describe.skipIf(!process.env.GROQ_API_KEY)("Groq (llama-4-scout-17b)", () => {
	const model = getModel("groq", "meta-llama/llama-4-scout-17b-16e-instruct");
	// Each limit probe issues several requests in sequence, so it gets a long timeout.
	const TEN_MINUTES = 10 * 60 * 1000;

	it("should accept a small number of images (5)", async () => {
		const { success, error } = await testImageCount(model, 5, smallImage);
		expect(success, error).toBe(true);
	});

	it("should find maximum image count limit", { timeout: TEN_MINUTES }, async () => {
		// Probe 5, 10, ... 50 images and stop at the first rejection.
		const sendImages = (count: number) => testImageCount(model, count, smallImage);
		const probe = await findLimit(sendImages, 5, 50, 5);
		console.log(`\n Groq max images: ~${probe.limit} (last error: ${probe.lastError})`);
		expect(probe.limit).toBeGreaterThanOrEqual(5);
	});

	it("should find maximum image size limit", { timeout: TEN_MINUTES }, async () => {
		// Walk 1MB..20MB and stop at the first rejection.
		const bytesPerMB = 1024 * 1024;
		let largestAccepted = 0;
		let rejection: string | undefined;
		for (const megabytes of [1, 5, 10, 15, 20]) {
			console.log(` Testing size: ${megabytes}MB...`);
			const payload = generateImageWithSize(megabytes * bytesPerMB, `size-${megabytes}mb.png`);
			const outcome = await testImageSize(model, payload);
			if (!outcome.success) {
				rejection = outcome.error;
				console.log(` FAILED: ${outcome.error?.substring(0, 100)}`);
				break;
			}
			largestAccepted = megabytes;
			console.log(` SUCCESS`);
		}
		console.log(`\n Groq max image size: ~${largestAccepted}MB (last error: ${rejection})`);
		expect(largestAccepted).toBeGreaterThanOrEqual(1);
	});

	it("should find maximum image dimension limit", { timeout: TEN_MINUTES }, async () => {
		// Walk square images of growing side length and stop at the first rejection.
		let largestAccepted = 0;
		let rejection: string | undefined;
		for (const side of [2000, 4000, 8000, 16000, 20000]) {
			console.log(` Testing dimension: ${side}x${side}...`);
			const payload = generateImage(side, side, `dim-${side}.png`);
			const outcome = await testImageDimensions(model, payload);
			if (!outcome.success) {
				rejection = outcome.error;
				console.log(` FAILED: ${outcome.error?.substring(0, 100)}`);
				break;
			}
			largestAccepted = side;
			console.log(` SUCCESS`);
		}
		console.log(`\n Groq max dimension: ~${largestAccepted}px (last error: ${rejection})`);
		expect(largestAccepted).toBeGreaterThanOrEqual(2000);
	});
});
// -------------------------------------------------------------------------
// zAI (glm-4.5v)
// Skipped unless ZAI_API_KEY is set.
// -------------------------------------------------------------------------
describe.skipIf(!process.env.ZAI_API_KEY)("zAI (glm-4.5v)", () => {
	const model = getModel("zai", "glm-4.5v");
	// Each limit probe issues several requests in sequence, so it gets a long timeout.
	const TEN_MINUTES = 10 * 60 * 1000;

	it("should accept a small number of images (5)", async () => {
		const { success, error } = await testImageCount(model, 5, smallImage);
		expect(success, error).toBe(true);
	});

	it("should find maximum image count limit", { timeout: TEN_MINUTES }, async () => {
		// Probe 10, 20, ... 100 images and stop at the first rejection.
		const sendImages = (count: number) => testImageCount(model, count, smallImage);
		const probe = await findLimit(sendImages, 10, 100, 10);
		console.log(`\n zAI max images: ~${probe.limit} (last error: ${probe.lastError})`);
		expect(probe.limit).toBeGreaterThanOrEqual(5);
	});

	it("should find maximum image size limit", { timeout: TEN_MINUTES }, async () => {
		// Walk 5MB..20MB and stop at the first rejection.
		const bytesPerMB = 1024 * 1024;
		let largestAccepted = 0;
		let rejection: string | undefined;
		for (const megabytes of [5, 10, 15, 20]) {
			console.log(` Testing size: ${megabytes}MB...`);
			const payload = generateImageWithSize(megabytes * bytesPerMB, `size-${megabytes}mb.png`);
			const outcome = await testImageSize(model, payload);
			if (!outcome.success) {
				rejection = outcome.error;
				console.log(` FAILED: ${outcome.error?.substring(0, 100)}`);
				break;
			}
			largestAccepted = megabytes;
			console.log(` SUCCESS`);
		}
		console.log(`\n zAI max image size: ~${largestAccepted}MB (last error: ${rejection})`);
		expect(largestAccepted).toBeGreaterThanOrEqual(5);
	});

	it("should find maximum image dimension limit", { timeout: TEN_MINUTES }, async () => {
		// Walk square images of growing side length and stop at the first rejection.
		let largestAccepted = 0;
		let rejection: string | undefined;
		for (const side of [2000, 4000, 8000, 16000, 20000]) {
			console.log(` Testing dimension: ${side}x${side}...`);
			const payload = generateImage(side, side, `dim-${side}.png`);
			const outcome = await testImageDimensions(model, payload);
			if (!outcome.success) {
				rejection = outcome.error;
				console.log(` FAILED: ${outcome.error?.substring(0, 100)}`);
				break;
			}
			largestAccepted = side;
			console.log(` SUCCESS`);
		}
		console.log(`\n zAI max dimension: ~${largestAccepted}px (last error: ${rejection})`);
		expect(largestAccepted).toBeGreaterThanOrEqual(2000);
	});
});
// -------------------------------------------------------------------------
// Vercel AI Gateway (google/gemini-2.5-flash)
// Skipped unless AI_GATEWAY_API_KEY is set. No dimension probe for this provider.
// -------------------------------------------------------------------------
describe.skipIf(!process.env.AI_GATEWAY_API_KEY)("Vercel AI Gateway (google/gemini-2.5-flash)", () => {
	const model = getModel("vercel-ai-gateway", "google/gemini-2.5-flash");
	// Each limit probe issues several requests in sequence, so it gets a long timeout.
	const TEN_MINUTES = 10 * 60 * 1000;

	it("should accept a small number of images (5)", async () => {
		const { success, error } = await testImageCount(model, 5, smallImage);
		expect(success, error).toBe(true);
	});

	it("should find maximum image count limit", { timeout: TEN_MINUTES }, async () => {
		// Probe 10, 20, ... 100 images and stop at the first rejection.
		const sendImages = (count: number) => testImageCount(model, count, smallImage);
		const probe = await findLimit(sendImages, 10, 100, 10);
		console.log(`\n Vercel AI Gateway max images: ~${probe.limit} (last error: ${probe.lastError})`);
		expect(probe.limit).toBeGreaterThanOrEqual(5);
	});

	it("should find maximum image size limit", { timeout: TEN_MINUTES }, async () => {
		// Walk 5MB..20MB and stop at the first rejection.
		const bytesPerMB = 1024 * 1024;
		let largestAccepted = 0;
		let rejection: string | undefined;
		for (const megabytes of [5, 10, 15, 20]) {
			console.log(` Testing size: ${megabytes}MB...`);
			const payload = generateImageWithSize(megabytes * bytesPerMB, `size-${megabytes}mb.png`);
			const outcome = await testImageSize(model, payload);
			if (!outcome.success) {
				rejection = outcome.error;
				console.log(` FAILED: ${outcome.error?.substring(0, 100)}`);
				break;
			}
			largestAccepted = megabytes;
			console.log(` SUCCESS`);
		}
		console.log(`\n Vercel AI Gateway max image size: ~${largestAccepted}MB (last error: ${rejection})`);
		expect(largestAccepted).toBeGreaterThanOrEqual(5);
	});
});
// -------------------------------------------------------------------------
// Amazon Bedrock (claude-sonnet-4-5)
// Known limits: 100 images (Anthropic), 5MB per image, 8000px max dimension
// Skipped unless hasBedrockCredentials() returns true.
// -------------------------------------------------------------------------
describe.skipIf(!hasBedrockCredentials())("Amazon Bedrock (claude-sonnet-4-5)", () => {
	const model = getModel("amazon-bedrock", "global.anthropic.claude-sonnet-4-5-20250929-v1:0");
	// Each limit probe issues several requests in sequence, so it gets a long timeout.
	const TEN_MINUTES = 10 * 60 * 1000;

	it("should accept a small number of images (5)", async () => {
		const { success, error } = await testImageCount(model, 5, smallImage);
		expect(success, error).toBe(true);
	});

	it("should find maximum image count limit", { timeout: TEN_MINUTES }, async () => {
		// Anthropic limit is 100 images: probing 20, 40, ... 120 should last succeed at 80 or 100.
		const sendImages = (count: number) => testImageCount(model, count, smallImage);
		const probe = await findLimit(sendImages, 20, 120, 20);
		console.log(`\n Bedrock max images: ~${probe.limit} (last error: ${probe.lastError})`);
		expect(probe.limit).toBeGreaterThanOrEqual(80);
		expect(probe.limit).toBeLessThanOrEqual(100);
	});

	it("should find maximum image size limit", { timeout: TEN_MINUTES }, async () => {
		// Anthropic limit is 5MB per image: walk 1MB..6MB and stop at the first rejection.
		const bytesPerMB = 1024 * 1024;
		let largestAccepted = 0;
		let rejection: string | undefined;
		for (const megabytes of [1, 2, 3, 4, 5, 6]) {
			console.log(` Testing size: ${megabytes}MB...`);
			const payload = generateImageWithSize(megabytes * bytesPerMB, `size-${megabytes}mb.png`);
			const outcome = await testImageSize(model, payload);
			if (!outcome.success) {
				rejection = outcome.error;
				console.log(` FAILED: ${outcome.error?.substring(0, 100)}`);
				break;
			}
			largestAccepted = megabytes;
			console.log(` SUCCESS`);
		}
		console.log(`\n Bedrock max image size: ~${largestAccepted}MB (last error: ${rejection})`);
		expect(largestAccepted).toBeGreaterThanOrEqual(1);
	});

	it("should find maximum image dimension limit", { timeout: TEN_MINUTES }, async () => {
		// Anthropic limit is 8000px: the largest accepted square should be 6000px or 8000px.
		let largestAccepted = 0;
		let rejection: string | undefined;
		for (const side of [1000, 2000, 4000, 6000, 8000, 10000]) {
			console.log(` Testing dimension: ${side}x${side}...`);
			const payload = generateImage(side, side, `dim-${side}.png`);
			const outcome = await testImageDimensions(model, payload);
			if (!outcome.success) {
				rejection = outcome.error;
				console.log(` FAILED: ${outcome.error?.substring(0, 100)}`);
				break;
			}
			largestAccepted = side;
			console.log(` SUCCESS`);
		}
		console.log(`\n Bedrock max dimension: ~${largestAccepted}px (last error: ${rejection})`);
		expect(largestAccepted).toBeGreaterThanOrEqual(6000);
		expect(largestAccepted).toBeLessThanOrEqual(8000);
	});
});
// =========================================================================
// MAX SIZE IMAGES TEST
// =========================================================================
// Tests how many images at (or near) max allowed size each provider can handle.
// This tests realistic payload limits, not just image count with tiny files.
//
// Note: A real 8kx8k noise PNG is ~183MB (exceeds all provider limits).
// So we test with images sized near each provider's actual size limit.
// =========================================================================
describe("Max Size Images (realistic payload stress test)", () => {
	// Base64 images keyed by the requested size in MB, so tests that ask for the
	// same size share a single generated payload.
	const imageCache = new Map<number, string>();

	/**
	 * Returns a base64 image of roughly `targetMB` megabytes, generating it on
	 * first use and serving it from the cache afterwards.
	 *
	 * @param targetMB Requested size in megabytes (passed on as `targetMB * 1024 * 1024` bytes).
	 * @returns The base64-encoded image produced by `generateImageWithSize`.
	 */
	function getImageAtSize(targetMB: number): string {
		// A single lookup replaces the has()/get()! pair and needs no non-null assertion.
		const cached = imageCache.get(targetMB);
		if (cached !== undefined) {
			return cached;
		}
		console.log(` Generating ~${targetMB}MB noise image...`);
		const imageBase64 = generateImageWithSize(targetMB * 1024 * 1024, `stress-${targetMB}mb.png`);
		// Log the decoded byte size, which can differ from the requested target.
		const actualSize = Buffer.from(imageBase64, "base64").length;
		console.log(` Actual size: ${(actualSize / 1024 / 1024).toFixed(2)}MB`);
		imageCache.set(targetMB, imageBase64);
		return imageBase64;
	}

	/**
	 * Sends requests with an increasing number of images and stops at the first
	 * rejection, then asserts that at least the first count was accepted.
	 *
	 * @param provider Provider name used in the summary log line.
	 * @param imageLabel Human-readable image description used in logs (e.g. "~3MB", "5760px").
	 * @param counts Image counts to try, in the order given.
	 * @param probe Performs one request with `count` images and reports success or the error.
	 */
	async function probeImageCounts(
		provider: string,
		imageLabel: string,
		counts: readonly number[],
		probe: (count: number) => ReturnType<typeof testImageCount>,
	): Promise<void> {
		let lastSuccess = 0;
		let lastError: string | undefined;
		for (const count of counts) {
			console.log(` Testing ${count} x ${imageLabel} images...`);
			const result = await probe(count);
			if (!result.success) {
				lastError = result.error;
				console.log(` FAILED: ${result.error?.substring(0, 150)}`);
				// Later counts are larger still, so stop at the first rejection.
				break;
			}
			lastSuccess = count;
			console.log(` SUCCESS`);
		}
		console.log(`\n ${provider} max ${imageLabel} images: ${lastSuccess} (last error: ${lastError})`);
		// Attach the provider error so a failing run explains itself.
		expect(lastSuccess, lastError).toBeGreaterThanOrEqual(1);
	}

	// Anthropic - 5MB per image limit, 32MB total request, 100 image count
	// Using 3MB to stay under 5MB limit (generateImageWithSize has overhead)
	it.skipIf(!process.env.ANTHROPIC_API_KEY)(
		"Anthropic: max ~3MB images before rejection",
		{ timeout: 900000 },
		async () => {
			const model = getModel("anthropic", "claude-3-5-haiku-20241022");
			const image3mb = getImageAtSize(3);
			// 32MB total limit / ~4MB actual = ~8 images
			await probeImageCounts("Anthropic", "~3MB", [1, 2, 4, 6, 8, 10, 12], (count) =>
				testImageCount(model, count, image3mb),
			);
		},
	);

	// Amazon Bedrock (Claude) - 5MB per image limit, same as Anthropic direct
	// Using 3MB to stay under 5MB limit
	it.skipIf(!hasBedrockCredentials())(
		"Bedrock: max ~3MB images before rejection",
		{ timeout: 900000 },
		async () => {
			const model = getModel("amazon-bedrock", "global.anthropic.claude-sonnet-4-5-20250929-v1:0");
			const image3mb = getImageAtSize(3);
			// Similar to Anthropic, test progressively
			await probeImageCounts("Bedrock", "~3MB", [1, 2, 4, 6, 8, 10, 12], (count) =>
				testImageCount(model, count, image3mb),
			);
		},
	);

	// OpenAI - 20MB per image documented, we found ≥25MB works
	// Test with 15MB images to stay safely under limit
	it.skipIf(!process.env.OPENAI_API_KEY)(
		"OpenAI: max ~15MB images before rejection",
		{ timeout: 1800000 },
		async () => {
			const model = getModel("openai", "gpt-4o-mini");
			const image15mb = getImageAtSize(15);
			// Test progressively
			await probeImageCounts("OpenAI", "~15MB", [1, 2, 5, 10, 20], (count) =>
				testImageCount(model, count, image15mb),
			);
		},
	);

	// Gemini - very permissive, ≥40MB per image works
	// Test with 20MB images
	it.skipIf(!process.env.GEMINI_API_KEY)(
		"Gemini: max ~20MB images before rejection",
		{ timeout: 1800000 },
		async () => {
			const model = getModel("google", "gemini-2.5-flash");
			const image20mb = getImageAtSize(20);
			// Test progressively
			await probeImageCounts("Gemini", "~20MB", [1, 2, 5, 10, 20, 50], (count) =>
				testImageCount(model, count, image20mb),
			);
		},
	);

	// Mistral - 8 image limit, ~15MB per image
	// Test with 10MB images (safely under limit)
	it.skipIf(!process.env.MISTRAL_API_KEY)(
		"Mistral: max ~10MB images before rejection",
		{ timeout: 600000 },
		async () => {
			const model = getModel("mistral", "pixtral-12b");
			const image10mb = getImageAtSize(10);
			// Known limit is 8 images
			await probeImageCounts("Mistral", "~10MB", [1, 2, 4, 6, 8, 9], (count) =>
				testImageCount(model, count, image10mb),
			);
		},
	);

	// xAI - 25MB per image limit (26214400 bytes exact)
	// Test with 20MB images (safely under limit)
	it.skipIf(!process.env.XAI_API_KEY)("xAI: max ~20MB images before rejection", { timeout: 1200000 }, async () => {
		const model = getModel("xai", "grok-2-vision");
		const image20mb = getImageAtSize(20);
		// Test progressively
		await probeImageCounts("xAI", "~20MB", [1, 2, 5, 10, 20], (count) =>
			testImageCount(model, count, image20mb),
		);
	});

	// Groq - very limited (5 images, ~5760px max due to 33M pixel limit)
	// 8k images (64M pixels) exceed limit, so test with 5760px images instead
	it.skipIf(!process.env.GROQ_API_KEY)(
		"Groq: max 5760px images before rejection",
		{ timeout: 600000 },
		async () => {
			const model = getModel("groq", "meta-llama/llama-4-scout-17b-16e-instruct");
			// Generate 5760x5760 image (33177600 pixels = Groq's limit)
			console.log(" Generating 5760x5760 test image for Groq...");
			const image5760 = generateImage(5760, 5760, "stress-5760.png");
			// Known limit is 5 images
			await probeImageCounts("Groq", "5760px", [1, 2, 3, 4, 5, 6], (count) =>
				testImageCount(model, count, image5760),
			);
		},
	);

	// zAI - ≥20MB per image, context-window limited (65k tokens)
	// Test with 15MB images
	it.skipIf(!process.env.ZAI_API_KEY)("zAI: max ~15MB images before rejection", { timeout: 1200000 }, async () => {
		const model = getModel("zai", "glm-4.5v");
		const image15mb = getImageAtSize(15);
		// Context-limited, test progressively
		await probeImageCounts("zAI", "~15MB", [1, 2, 5, 10, 20], (count) =>
			testImageCount(model, count, image15mb),
		);
	});

	// OpenRouter - ~10MB per image, context-window limited (65k tokens)
	// Test with 5MB images (safer size)
	it.skipIf(!process.env.OPENROUTER_API_KEY)(
		"OpenRouter: max ~5MB images before rejection",
		{ timeout: 900000 },
		async () => {
			const model = getModel("openrouter", "z-ai/glm-4.5v");
			const image5mb = getImageAtSize(5);
			// Context-limited, test progressively
			await probeImageCounts("OpenRouter", "~5MB", [1, 2, 5, 10, 20], (count) =>
				testImageCount(model, count, image5mb),
			);
		},
	);
});
});