diff --git a/packages/data/providers/cerebras/models/gemma-4-31b.json b/packages/data/providers/cerebras/models/gemma-4-31b.json index 98ea53d32..f6fa8c31b 100644 --- a/packages/data/providers/cerebras/models/gemma-4-31b.json +++ b/packages/data/providers/cerebras/models/gemma-4-31b.json @@ -42,7 +42,12 @@ "endpoints": "772bacef", "tools": "f0c1dc7e", "model_card_url": "682a4569", - "tokens_per_second": "8c3039bd" + "tokens_per_second": "8c3039bd", + "pricing": "f7bf6ae9" }, - "last_updated": "2026-06-29" + "last_updated": "2026-06-30", + "pricing": { + "input": 0.99, + "output": 1.49 + } } diff --git a/packages/data/providers/deepinfra/models/deepreinforce-ai-ornith-1.0-35b.json b/packages/data/providers/deepinfra/models/deepreinforce-ai-ornith-1.0-35b.json index be825e76c..5c50ecd26 100644 --- a/packages/data/providers/deepinfra/models/deepreinforce-ai-ornith-1.0-35b.json +++ b/packages/data/providers/deepinfra/models/deepreinforce-ai-ornith-1.0-35b.json @@ -40,7 +40,11 @@ "pricing": "c7984d1d", "tools": "f0c1dc7e", "endpoints": "d8fa1080", - "quantization": "640679f9" + "quantization": "640679f9", + "description": "74c223d2", + "tagline": "61e5332e" }, - "last_updated": "2026-06-29" + "last_updated": "2026-06-30", + "description": "Ornith-1.0-35B is DeepReinforce's open (MIT-licensed) agentic-coding model: an RL post-train of Qwen3.5-35B-A3B, a 35B-total / ~3B-active Mixture-of-Experts with hybrid Gated-DeltaNet attention. It targets state-of-the-art open-model coding-agent performance (SWE-bench Verified 75.6, Terminal-Bench 2.1 64.2) with a 262K-token context, thinking/reasoning mode, tool calling, and image + video understanding.", + "tagline": "Ornith-1.0-35B is DeepReinforce's open (MIT-licensed) agentic-coding model: an RL post-train of Qwen3.5-35B-A3B, a 35B-total / ~3B-active Mixture-of-Experts with hybrid Gated-DeltaNet attention." 
} diff --git a/packages/data/providers/deepinfra/models/minimaxai-minimax-m2.7-turbo.json b/packages/data/providers/deepinfra/models/minimaxai-minimax-m2.7-turbo.json index 28fe9cc2b..4cd9a1aea 100644 --- a/packages/data/providers/deepinfra/models/minimaxai-minimax-m2.7-turbo.json +++ b/packages/data/providers/deepinfra/models/minimaxai-minimax-m2.7-turbo.json @@ -24,8 +24,8 @@ "output": ["text"] }, "pricing": { - "input": 0.45, - "output": 2.1 + "input": 0.4, + "output": 2 }, "tools": ["function_calling"], "endpoints": ["chat_completions"], @@ -43,10 +43,10 @@ "tagline": "a6d84fdf", "capabilities": "56245a77", "modalities": "68e53d93", - "pricing": "b05048aa", + "pricing": "70b90c36", "tools": "f0c1dc7e", "endpoints": "d8fa1080", "quantization": "640679f9" }, - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" } diff --git a/packages/data/providers/fal/models/bria-extract-object.json b/packages/data/providers/fal/models/bria-extract-object.json new file mode 100644 index 000000000..805cd40bb --- /dev/null +++ b/packages/data/providers/fal/models/bria-extract-object.json @@ -0,0 +1,35 @@ +{ + "id": "bria/extract-object", + "name": "Extract Object", + "created_by": "bria", + "source": "official", + "description": "Bria Extract Object uses text prompts to isolate a selected object from an image and return it as an RGBA PNG with a transparent background.", + "status": "active", + "release_date": "2026-06-28", + "model_type": "image", + "page_url": "https://fal.run/bria/extract-object", + "tagline": "Bria Extract Object uses text prompts to isolate a selected object from an image and return it as an RGBA PNG with a transparent background.", + "capabilities": { + "vision": true + }, + "modalities": { + "input": ["text", "image"], + "output": ["image"] + }, + "endpoints": ["images"], + "last_seen_at": "2026-06-29", + "_generated": { + "name": "7b756530", + "description": "d3c19199", + "status": "379ac110", + "release_date": "bde5bfbb", + "model_type": 
"db8857fe", + "page_url": "8a58ef65", + "tagline": "d3c19199", + "capabilities": "d3117eb0", + "modalities": "bbf9b8bb", + "endpoints": "9a7c17cc", + "last_seen_at": "6717d6db" + }, + "last_updated": "2026-06-30" +} diff --git a/packages/data/providers/fal/models/fal-ai-flux-2-klein-9b.json b/packages/data/providers/fal/models/fal-ai-flux-2-klein-9b.json index 30777fc33..8b530f084 100644 --- a/packages/data/providers/fal/models/fal-ai-flux-2-klein-9b.json +++ b/packages/data/providers/fal/models/fal-ai-flux-2-klein-9b.json @@ -18,7 +18,7 @@ "output": ["image"] }, "endpoints": ["images"], - "last_seen_at": "2026-01-26", + "last_seen_at": "2026-06-30", "_generated": { "name": "929b507a", "description": "5bfd20fc", @@ -30,7 +30,7 @@ "capabilities": "8a3b232e", "modalities": "814867b9", "endpoints": "9a7c17cc", - "last_seen_at": "5c252aee" + "last_seen_at": "ebf8cb32" }, - "last_updated": "2026-05-11" + "last_updated": "2026-06-30" } diff --git a/packages/data/providers/fal/models/fal-ai-hyper3d-rodin-v2.5-fast.json b/packages/data/providers/fal/models/fal-ai-hyper3d-rodin-v2.5-fast.json index c5708c412..d54e0a372 100644 --- a/packages/data/providers/fal/models/fal-ai-hyper3d-rodin-v2.5-fast.json +++ b/packages/data/providers/fal/models/fal-ai-hyper3d-rodin-v2.5-fast.json @@ -12,7 +12,7 @@ "capabilities": { "vision": true }, - "last_seen_at": "2026-06-24", + "last_seen_at": "2026-06-29", "_generated": { "name": "4ec3d424", "description": "b361b4d3", @@ -22,7 +22,7 @@ "page_url": "935930c9", "tagline": "b361b4d3", "capabilities": "d3117eb0", - "last_seen_at": "b7ac61f6" + "last_seen_at": "6717d6db" }, - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" } diff --git a/packages/data/providers/fal/models/fal-ai-hyper3d-rodin-v2.5-text-to-3d-fast.json b/packages/data/providers/fal/models/fal-ai-hyper3d-rodin-v2.5-text-to-3d-fast.json index b589ad5be..a685a1910 100644 --- a/packages/data/providers/fal/models/fal-ai-hyper3d-rodin-v2.5-text-to-3d-fast.json +++ 
b/packages/data/providers/fal/models/fal-ai-hyper3d-rodin-v2.5-text-to-3d-fast.json @@ -12,7 +12,7 @@ "capabilities": { "vision": true }, - "last_seen_at": "2026-06-24", + "last_seen_at": "2026-06-29", "_generated": { "name": "58ba7137", "description": "b361b4d3", @@ -22,7 +22,7 @@ "page_url": "8d3a9bfe", "tagline": "b361b4d3", "capabilities": "d3117eb0", - "last_seen_at": "b7ac61f6" + "last_seen_at": "6717d6db" }, - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" } diff --git a/packages/data/providers/fal/models/fal-ai-topaz-upscale-video.json b/packages/data/providers/fal/models/fal-ai-topaz-upscale-video.json index fcebc8298..e5f668b11 100644 --- a/packages/data/providers/fal/models/fal-ai-topaz-upscale-video.json +++ b/packages/data/providers/fal/models/fal-ai-topaz-upscale-video.json @@ -9,7 +9,7 @@ "model_type": "other", "page_url": "https://fal.run/fal-ai/topaz/upscale/video", "tagline": "Professional-grade video upscaling using Topaz technology.", - "last_seen_at": "2026-05-26", + "last_seen_at": "2026-06-29", "_generated": { "name": "1ba50a12", "description": "57d6d065", @@ -18,7 +18,7 @@ "model_type": "ddb0b7bc", "page_url": "b5369296", "tagline": "57d6d065", - "last_seen_at": "1fa0004f" + "last_seen_at": "6717d6db" }, - "last_updated": "2026-06-03" + "last_updated": "2026-06-30" } diff --git a/packages/data/providers/fal/models/fal-ai-z-image-turbo.json b/packages/data/providers/fal/models/fal-ai-z-image-turbo.json index 0cdf9c6c9..51c4de58a 100644 --- a/packages/data/providers/fal/models/fal-ai-z-image-turbo.json +++ b/packages/data/providers/fal/models/fal-ai-z-image-turbo.json @@ -17,7 +17,7 @@ "output": ["image"] }, "endpoints": ["images"], - "last_seen_at": "2026-04-28", + "last_seen_at": "2026-06-30", "_generated": { "name": "c0b6417c", "description": "924942f7", @@ -29,7 +29,7 @@ "capabilities": "d3117eb0", "modalities": "814867b9", "endpoints": "9a7c17cc", - "last_seen_at": "52326430" + "last_seen_at": "ebf8cb32" }, - "last_updated": 
"2026-06-03" + "last_updated": "2026-06-30" } diff --git a/packages/data/providers/google/models/veo-2.0-generate-001.json b/packages/data/providers/google/models/veo-2.0-generate-001.json index 0b3d040a8..071327739 100644 --- a/packages/data/providers/google/models/veo-2.0-generate-001.json +++ b/packages/data/providers/google/models/veo-2.0-generate-001.json @@ -3,8 +3,8 @@ "name": "veo-2.0-generate-001", "created_by": "google", "source": "official", - "last_updated": "2026-06-29", - "status": "active", + "last_updated": "2026-06-30", + "status": "deprecated", "model_type": "video", "capabilities": { "streaming": true, @@ -23,7 +23,7 @@ "endpoints": ["generateContent", "streamGenerateContent"], "_generated": { "name": "89076b1f", - "status": "379ac110", + "status": "2e2f74dc", "model_type": "4d1b75ca", "capabilities": "fdff467b", "modalities": "85fd0565", @@ -34,12 +34,20 @@ "page_url": "089bd203", "open_weight": "68934a3e", "description": "a07bf735", - "tagline": "b16f53f3" + "tagline": "b16f53f3", + "deprecation_date": "ebf8cb32", + "successor": "712c232f" }, "family": "veo-2.0", "license": "proprietary", "page_url": "https://ai.google.dev/gemini-api/docs/models/veo-2.0-generate-001", "open_weight": false, "description": "The Interactions API is now generally available. We recommend using this API for access to all the latest features and models. Home Gemini API Docs Send feedback Veo 2.0 This model is deprecated and will be shut down on **June 30, 2026**; migrate to Veo 3.1 Preview or the GA models available through the Gemini Enterprise Agent Platform to avoid service interruptions. Our robust and reliable stable video generation model, providing consistent performance for production-ready workflows. 
Veo 2.0 is best for standard 1080p content creation, social media assets, and high-volume video tasks that prioritize reliable character consistency and predictable sub-second generation speeds.", - "tagline": "Our robust and reliable stable video generation model, providing consistent performance for production-ready workflows." + "tagline": "Our robust and reliable stable video generation model, providing consistent performance for production-ready workflows.", + "deprecation_date": "2026-06-30", + "successor": [ + "veo-3.1-generate-preview", + "the GA models on the Gemini Enterprise Agent Platf", + "m" + ] } diff --git a/packages/data/providers/google/models/veo-3.0-fast-generate-001.json b/packages/data/providers/google/models/veo-3.0-fast-generate-001.json index c1d1fcf34..431700c76 100644 --- a/packages/data/providers/google/models/veo-3.0-fast-generate-001.json +++ b/packages/data/providers/google/models/veo-3.0-fast-generate-001.json @@ -4,7 +4,7 @@ "created_by": "google", "source": "official", "family": "veo-3.0", - "status": "active", + "status": "deprecated", "license": "proprietary", "model_type": "video", "modalities": { @@ -15,11 +15,19 @@ "_generated": { "name": "7f1d98ab", "family": "adc96752", - "status": "379ac110", + "status": "2e2f74dc", "license": "9186c466", "model_type": "4d1b75ca", "modalities": "94e5e9ab", - "open_weight": "68934a3e" + "open_weight": "68934a3e", + "deprecation_date": "ebf8cb32", + "successor": "b7b2c62c" }, - "last_updated": "2026-06-18" + "last_updated": "2026-06-30", + "deprecation_date": "2026-06-30", + "successor": [ + "veo-3.1-fast-generate-preview", + "the GA models on the Gemini Enterprise Agent Platf", + "m" + ] } diff --git a/packages/data/providers/google/models/veo-3.0-generate-001.json b/packages/data/providers/google/models/veo-3.0-generate-001.json index 053fdb917..02a647f44 100644 --- a/packages/data/providers/google/models/veo-3.0-generate-001.json +++ 
b/packages/data/providers/google/models/veo-3.0-generate-001.json @@ -4,7 +4,7 @@ "created_by": "google", "source": "official", "family": "veo-3.0", - "status": "active", + "status": "deprecated", "license": "proprietary", "model_type": "video", "modalities": { @@ -15,11 +15,19 @@ "_generated": { "name": "96869595", "family": "adc96752", - "status": "379ac110", + "status": "2e2f74dc", "license": "9186c466", "model_type": "4d1b75ca", "modalities": "94e5e9ab", - "open_weight": "68934a3e" + "open_weight": "68934a3e", + "deprecation_date": "ebf8cb32", + "successor": "712c232f" }, - "last_updated": "2026-06-18" + "last_updated": "2026-06-30", + "deprecation_date": "2026-06-30", + "successor": [ + "veo-3.1-generate-preview", + "the GA models on the Gemini Enterprise Agent Platf", + "m" + ] } diff --git a/packages/data/providers/huggingface/models/deepreinforce-ai-ornith-1.0-35b.json b/packages/data/providers/huggingface/models/deepreinforce-ai-ornith-1.0-35b.json new file mode 100644 index 000000000..03a5a250d --- /dev/null +++ b/packages/data/providers/huggingface/models/deepreinforce-ai-ornith-1.0-35b.json @@ -0,0 +1,30 @@ +{ + "id": "deepreinforce-ai/Ornith-1.0-35B", + "name": "Ornith-1.0-35B", + "created_by": "deepreinforce-ai", + "source": "official", + "release_date": "2026-06-21", + "license": "mit", + "parameters": 0, + "page_url": "https://huggingface.co/deepreinforce-ai/Ornith-1.0-35B", + "architecture": "moe", + "capabilities": { + "streaming": true, + "tool_call": true, + "fine_tuning": true + }, + "open_weight": true, + "tools": ["function_calling"], + "_generated": { + "name": "fe3b916f", + "release_date": "578c5012", + "license": "3c4c3ba5", + "parameters": "cfcd2084", + "page_url": "a4c6f0bf", + "architecture": "31b2172c", + "capabilities": "5780d00a", + "open_weight": "b326b506", + "tools": "f0c1dc7e" + }, + "last_updated": "2026-06-30" +} diff --git a/packages/data/providers/openrouter/models/poolside-laguna-xs.2-free.json 
b/packages/data/providers/openrouter/models/poolside-laguna-xs.2-free.json index e3a4d98f5..e09aad4fe 100644 --- a/packages/data/providers/openrouter/models/poolside-laguna-xs.2-free.json +++ b/packages/data/providers/openrouter/models/poolside-laguna-xs.2-free.json @@ -28,7 +28,11 @@ "tagline": "38c39fb4", "capabilities": "9346c8a7", "modalities": "68e53d93", - "tools": "f0c1dc7e" + "tools": "f0c1dc7e", + "status": "2e2f74dc", + "deprecation_date": "6e178682" }, - "last_updated": "2026-06-18" + "last_updated": "2026-06-30", + "status": "deprecated", + "deprecation_date": "9999-01-01" } diff --git a/packages/data/providers/openrouter/models/stepfun-step-3.5-flash.json b/packages/data/providers/openrouter/models/stepfun-step-3.5-flash.json index 802d43a72..99fb0f16e 100644 --- a/packages/data/providers/openrouter/models/stepfun-step-3.5-flash.json +++ b/packages/data/providers/openrouter/models/stepfun-step-3.5-flash.json @@ -3,10 +3,10 @@ "name": "StepFun: Step 3.5 Flash", "created_by": "stepfun", "source": "official", - "last_updated": "2026-06-29", + "last_updated": "2026-06-30", "description": "Step 3.5 Flash is StepFun's most capable open-source foundation model.", "context_window": 262144, - "max_output_tokens": 16384, + "max_output_tokens": 65536, "modalities": { "input": ["text"], "output": ["text"] @@ -18,7 +18,7 @@ "json_mode": true }, "pricing": { - "input": 0.09, + "input": 0.1, "output": 0.3, "cached_input": 0.02 }, @@ -26,10 +26,10 @@ "name": "9adbecc9", "description": "022938e2", "context_window": "4a1d32eb", - "max_output_tokens": "c76fe1d8", + "max_output_tokens": "297ce0b3", "modalities": "68e53d93", "capabilities": "9346c8a7", - "pricing": "248c0ec9", + "pricing": "341f9351", "release_date": "d017f790", "tagline": "022938e2", "tools": "f0c1dc7e", diff --git a/packages/data/providers/openrouter/models/z-ai-glm-5.1.json b/packages/data/providers/openrouter/models/z-ai-glm-5.1.json index cb9fcc817..0c130e7f3 100644 --- 
a/packages/data/providers/openrouter/models/z-ai-glm-5.1.json +++ b/packages/data/providers/openrouter/models/z-ai-glm-5.1.json @@ -20,8 +20,8 @@ "output": ["text"] }, "pricing": { - "input": 0.98, - "output": 3.08, + "input": 0.975, + "output": 4.3, "cached_input": 0.182 }, "tools": ["function_calling"], @@ -35,10 +35,10 @@ "tagline": "92718637", "capabilities": "03fbefb4", "modalities": "68e53d93", - "pricing": "538a22d4", + "pricing": "8922c706", "tools": "f0c1dc7e", "max_output_tokens": "f7de594e" }, - "last_updated": "2026-06-02", + "last_updated": "2026-06-30", "max_output_tokens": 131072 } diff --git a/packages/data/providers/openrouter/models/z-ai-glm-5.2.json b/packages/data/providers/openrouter/models/z-ai-glm-5.2.json index 75e46047d..126a4b056 100644 --- a/packages/data/providers/openrouter/models/z-ai-glm-5.2.json +++ b/packages/data/providers/openrouter/models/z-ai-glm-5.2.json @@ -21,7 +21,7 @@ "output": ["text"] }, "pricing": { - "input": 0.95, + "input": 0.94, "output": 3, "cached_input": 0.18 }, @@ -37,8 +37,8 @@ "tagline": "241852ce", "capabilities": "03fbefb4", "modalities": "68e53d93", - "pricing": "e6f9b227", + "pricing": "f16824eb", "tools": "f0c1dc7e" }, - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" } diff --git a/packages/data/providers/stability/models/ar-stablelm-2-chat.json b/packages/data/providers/stability/models/ar-stablelm-2-chat.json index 93c6459b5..cc4026611 100644 --- a/packages/data/providers/stability/models/ar-stablelm-2-chat.json +++ b/packages/data/providers/stability/models/ar-stablelm-2-chat.json @@ -20,7 +20,7 @@ "output": ["text"] }, "endpoints": ["chat_completions"], - "huggingface_downloads": 7, + "huggingface_downloads": 10, "last_modified": "2024-12-06", "_generated": { "name": "878f768d", @@ -35,8 +35,8 @@ "capabilities": "9c665f5d", "modalities": "68e53d93", "endpoints": "d8fa1080", - "huggingface_downloads": "8f14e45f", + "huggingface_downloads": "d3d94468", "last_modified": "725ace28" }, - 
"last_updated": "2026-06-29" + "last_updated": "2026-06-30" } diff --git a/packages/data/providers/stability/models/codellama13b_instruct_260k_synthesis.json b/packages/data/providers/stability/models/codellama13b_instruct_260k_synthesis.json index 4238b5bc9..d7e3f85e7 100644 --- a/packages/data/providers/stability/models/codellama13b_instruct_260k_synthesis.json +++ b/packages/data/providers/stability/models/codellama13b_instruct_260k_synthesis.json @@ -19,7 +19,7 @@ "output": ["text"] }, "endpoints": ["chat_completions"], - "huggingface_downloads": 38, + "huggingface_downloads": 36, "last_modified": "2023-11-08", "_generated": { "name": "0bfe3854", @@ -34,8 +34,8 @@ "capabilities": "0fa77dc6", "modalities": "68e53d93", "endpoints": "d8fa1080", - "huggingface_downloads": "a5771bce", + "huggingface_downloads": "19ca14e7", "last_modified": "8565ad2e" }, - "last_updated": "2026-06-20" + "last_updated": "2026-06-30" } diff --git a/packages/data/providers/stability/models/japanese-instructblip-alpha.json b/packages/data/providers/stability/models/japanese-instructblip-alpha.json index a3c86b035..3c5c5bfda 100644 --- a/packages/data/providers/stability/models/japanese-instructblip-alpha.json +++ b/packages/data/providers/stability/models/japanese-instructblip-alpha.json @@ -21,7 +21,7 @@ "output": ["text"] }, "endpoints": ["chat_completions"], - "huggingface_downloads": 59, + "huggingface_downloads": 49, "last_modified": "2023-11-17", "_generated": { "name": "f328bd00", @@ -36,8 +36,8 @@ "capabilities": "944b5fe5", "modalities": "6399757e", "endpoints": "d8fa1080", - "huggingface_downloads": "093f65e0", + "huggingface_downloads": "f457c545", "last_modified": "4df53c88" }, - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" } diff --git a/packages/data/providers/stability/models/japanese-stable-clip-vit-l-16.json b/packages/data/providers/stability/models/japanese-stable-clip-vit-l-16.json index 8c0bcc146..587423b62 100644 --- 
a/packages/data/providers/stability/models/japanese-stable-clip-vit-l-16.json +++ b/packages/data/providers/stability/models/japanese-stable-clip-vit-l-16.json @@ -21,7 +21,7 @@ "output": ["text"] }, "endpoints": ["chat_completions"], - "huggingface_downloads": 1660, + "huggingface_downloads": 1579, "last_modified": "2024-07-10", "_generated": { "name": "7f328791", @@ -36,8 +36,8 @@ "capabilities": "98ea92bd", "modalities": "6399757e", "endpoints": "d8fa1080", - "huggingface_downloads": "9a440050", + "huggingface_downloads": "ed422773", "last_modified": "2d84b9f9" }, - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" } diff --git a/packages/data/providers/stability/models/japanese-stable-vlm.json b/packages/data/providers/stability/models/japanese-stable-vlm.json index 20f653a9a..a42d9bb53 100644 --- a/packages/data/providers/stability/models/japanese-stable-vlm.json +++ b/packages/data/providers/stability/models/japanese-stable-vlm.json @@ -21,7 +21,7 @@ "output": ["text"] }, "endpoints": ["chat_completions"], - "huggingface_downloads": 13, + "huggingface_downloads": 14, "last_modified": "2024-07-10", "_generated": { "name": "ccc610e4", @@ -36,8 +36,8 @@ "capabilities": "944b5fe5", "modalities": "6399757e", "endpoints": "d8fa1080", - "huggingface_downloads": "c51ce410", + "huggingface_downloads": "aab32389", "last_modified": "2d84b9f9" }, - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" } diff --git a/packages/data/providers/stability/models/japanese-stablelm-3b-4e1t-base.json b/packages/data/providers/stability/models/japanese-stablelm-3b-4e1t-base.json index 343170732..1ce44aeb5 100644 --- a/packages/data/providers/stability/models/japanese-stablelm-3b-4e1t-base.json +++ b/packages/data/providers/stability/models/japanese-stablelm-3b-4e1t-base.json @@ -21,7 +21,7 @@ "output": ["text"] }, "endpoints": ["chat_completions"], - "huggingface_downloads": 48, + "huggingface_downloads": 45, "last_modified": "2024-04-26", "_generated": { "name": 
"e0176872", @@ -37,8 +37,8 @@ "capabilities": "9c665f5d", "modalities": "68e53d93", "endpoints": "d8fa1080", - "huggingface_downloads": "642e92ef", + "huggingface_downloads": "6c8349cc", "last_modified": "25e66158" }, - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" } diff --git a/packages/data/providers/stability/models/japanese-stablelm-3b-4e1t-instruct.json b/packages/data/providers/stability/models/japanese-stablelm-3b-4e1t-instruct.json index 4689fe412..fff543ec1 100644 --- a/packages/data/providers/stability/models/japanese-stablelm-3b-4e1t-instruct.json +++ b/packages/data/providers/stability/models/japanese-stablelm-3b-4e1t-instruct.json @@ -21,7 +21,7 @@ "output": ["text"] }, "endpoints": ["chat_completions"], - "huggingface_downloads": 148, + "huggingface_downloads": 147, "last_modified": "2024-04-26", "_generated": { "name": "036b64b3", @@ -37,8 +37,8 @@ "capabilities": "9c665f5d", "modalities": "68e53d93", "endpoints": "d8fa1080", - "huggingface_downloads": "47d1e990", + "huggingface_downloads": "8d5e957f", "last_modified": "25e66158" }, - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" } diff --git a/packages/data/providers/stability/models/japanese-stablelm-base-alpha-7b.json b/packages/data/providers/stability/models/japanese-stablelm-base-alpha-7b.json index c362e57a7..2eea3e131 100644 --- a/packages/data/providers/stability/models/japanese-stablelm-base-alpha-7b.json +++ b/packages/data/providers/stability/models/japanese-stablelm-base-alpha-7b.json @@ -21,7 +21,7 @@ "output": ["text"] }, "endpoints": ["chat_completions"], - "huggingface_downloads": 330, + "huggingface_downloads": 310, "last_modified": "2023-08-22", "_generated": { "name": "2ba675d8", @@ -37,8 +37,8 @@ "capabilities": "9c665f5d", "modalities": "68e53d93", "endpoints": "d8fa1080", - "huggingface_downloads": "fe73f687", + "huggingface_downloads": "06eb61b8", "last_modified": "74743675" }, - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" } diff 
--git a/packages/data/providers/stability/models/japanese-stablelm-base-beta-70b.json b/packages/data/providers/stability/models/japanese-stablelm-base-beta-70b.json index 2a43a173e..17e1708b4 100644 --- a/packages/data/providers/stability/models/japanese-stablelm-base-beta-70b.json +++ b/packages/data/providers/stability/models/japanese-stablelm-base-beta-70b.json @@ -21,7 +21,7 @@ "output": ["text"] }, "endpoints": ["chat_completions"], - "huggingface_downloads": 127, + "huggingface_downloads": 126, "last_modified": "2023-12-19", "_generated": { "name": "d4722d0b", @@ -37,8 +37,8 @@ "capabilities": "9c665f5d", "modalities": "68e53d93", "endpoints": "d8fa1080", - "huggingface_downloads": "ec5decca", + "huggingface_downloads": "069059b7", "last_modified": "306375dc" }, - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" } diff --git a/packages/data/providers/stability/models/japanese-stablelm-base-beta-7b.json b/packages/data/providers/stability/models/japanese-stablelm-base-beta-7b.json index 9106b11a5..04a5c5a09 100644 --- a/packages/data/providers/stability/models/japanese-stablelm-base-beta-7b.json +++ b/packages/data/providers/stability/models/japanese-stablelm-base-beta-7b.json @@ -21,7 +21,7 @@ "output": ["text"] }, "endpoints": ["chat_completions"], - "huggingface_downloads": 50, + "huggingface_downloads": 48, "last_modified": "2023-12-19", "_generated": { "name": "fd70cf93", @@ -37,8 +37,8 @@ "capabilities": "9c665f5d", "modalities": "68e53d93", "endpoints": "d8fa1080", - "huggingface_downloads": "c0c7c76d", + "huggingface_downloads": "642e92ef", "last_modified": "306375dc" }, - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" } diff --git a/packages/data/providers/stability/models/japanese-stablelm-base-ja_vocab-beta-7b.json b/packages/data/providers/stability/models/japanese-stablelm-base-ja_vocab-beta-7b.json index 678f8c1ee..e33cbc986 100644 --- a/packages/data/providers/stability/models/japanese-stablelm-base-ja_vocab-beta-7b.json 
+++ b/packages/data/providers/stability/models/japanese-stablelm-base-ja_vocab-beta-7b.json @@ -21,7 +21,7 @@ "output": ["text"] }, "endpoints": ["chat_completions"], - "huggingface_downloads": 40, + "huggingface_downloads": 39, "last_modified": "2023-12-19", "_generated": { "name": "0627ce1b", @@ -37,8 +37,8 @@ "capabilities": "9c665f5d", "modalities": "68e53d93", "endpoints": "d8fa1080", - "huggingface_downloads": "d645920e", + "huggingface_downloads": "d67d8ab4", "last_modified": "306375dc" }, - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" } diff --git a/packages/data/providers/stability/models/japanese-stablelm-instruct-alpha-7b-v2.json b/packages/data/providers/stability/models/japanese-stablelm-instruct-alpha-7b-v2.json index a4789de73..7cc14e03b 100644 --- a/packages/data/providers/stability/models/japanese-stablelm-instruct-alpha-7b-v2.json +++ b/packages/data/providers/stability/models/japanese-stablelm-instruct-alpha-7b-v2.json @@ -21,7 +21,7 @@ "output": ["text"] }, "endpoints": ["chat_completions"], - "huggingface_downloads": 40, + "huggingface_downloads": 38, "last_modified": "2023-10-06", "_generated": { "name": "9383bbab", @@ -37,8 +37,8 @@ "capabilities": "9c665f5d", "modalities": "68e53d93", "endpoints": "d8fa1080", - "huggingface_downloads": "d645920e", + "huggingface_downloads": "a5771bce", "last_modified": "b713276e" }, - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" } diff --git a/packages/data/providers/stability/models/japanese-stablelm-instruct-ja_vocab-beta-7b.json b/packages/data/providers/stability/models/japanese-stablelm-instruct-ja_vocab-beta-7b.json index 49f08b0ba..f6c745305 100644 --- a/packages/data/providers/stability/models/japanese-stablelm-instruct-ja_vocab-beta-7b.json +++ b/packages/data/providers/stability/models/japanese-stablelm-instruct-ja_vocab-beta-7b.json @@ -21,7 +21,7 @@ "output": ["text"] }, "endpoints": ["chat_completions"], - "huggingface_downloads": 45, + "huggingface_downloads": 44, 
"last_modified": "2023-12-19", "_generated": { "name": "0c14ddd1", @@ -37,8 +37,8 @@ "capabilities": "9c665f5d", "modalities": "68e53d93", "endpoints": "d8fa1080", - "huggingface_downloads": "6c8349cc", + "huggingface_downloads": "f7177163", "last_modified": "306375dc" }, - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" } diff --git a/packages/data/providers/stability/models/same-l.json b/packages/data/providers/stability/models/same-l.json index f6668b814..a3a8779ce 100644 --- a/packages/data/providers/stability/models/same-l.json +++ b/packages/data/providers/stability/models/same-l.json @@ -20,7 +20,7 @@ "output": ["text"] }, "endpoints": ["chat_completions"], - "huggingface_downloads": 6323, + "huggingface_downloads": 6334, "last_modified": "2026-06-24", "_generated": { "name": "eb4ee27e", @@ -35,8 +35,8 @@ "capabilities": "9c665f5d", "modalities": "68e53d93", "endpoints": "d8fa1080", - "huggingface_downloads": "14eac0d2", + "huggingface_downloads": "d0cffa36", "last_modified": "b7ac61f6" }, - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" } diff --git a/packages/data/providers/stability/models/same-s.json b/packages/data/providers/stability/models/same-s.json index bc34b66da..469cd511c 100644 --- a/packages/data/providers/stability/models/same-s.json +++ b/packages/data/providers/stability/models/same-s.json @@ -20,7 +20,7 @@ "output": ["text"] }, "endpoints": ["chat_completions"], - "huggingface_downloads": 1549, + "huggingface_downloads": 1587, "last_modified": "2026-05-19", "_generated": { "name": "ec279f3f", @@ -35,8 +35,8 @@ "capabilities": "9c665f5d", "modalities": "68e53d93", "endpoints": "d8fa1080", - "huggingface_downloads": "c88d8d0a", + "huggingface_downloads": "49af6c4e", "last_modified": "665f01a0" }, - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" } diff --git a/packages/data/providers/stability/models/sd-turbo.json b/packages/data/providers/stability/models/sd-turbo.json index 2c5a87a36..6be380c23 100644 
--- a/packages/data/providers/stability/models/sd-turbo.json +++ b/packages/data/providers/stability/models/sd-turbo.json @@ -18,7 +18,7 @@ "output": ["image"] }, "endpoints": ["images"], - "huggingface_downloads": 698263, + "huggingface_downloads": 684119, "last_modified": "2024-07-10", "_generated": { "name": "66a258a1", @@ -32,8 +32,8 @@ "capabilities": "d3117eb0", "modalities": "814867b9", "endpoints": "9a7c17cc", - "huggingface_downloads": "a28f6eb9", + "huggingface_downloads": "716e3267", "last_modified": "2d84b9f9" }, - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" } diff --git a/packages/data/providers/stability/models/sd-vae-ft-ema.json b/packages/data/providers/stability/models/sd-vae-ft-ema.json index ea1132dfc..318a2dbec 100644 --- a/packages/data/providers/stability/models/sd-vae-ft-ema.json +++ b/packages/data/providers/stability/models/sd-vae-ft-ema.json @@ -11,7 +11,7 @@ "page_url": "https://huggingface.co/stabilityai/sd-vae-ft-ema", "open_weight": true, "tagline": "Sd Vae Ft Ema is a Stability AI model published on the official Stability AI Hugging Face organization.", - "huggingface_downloads": 7037, + "huggingface_downloads": 6837, "last_modified": "2023-06-05", "_generated": { "name": "46031e67", @@ -23,8 +23,8 @@ "page_url": "3f87a050", "open_weight": "b326b506", "tagline": "2b74ba71", - "huggingface_downloads": "7c39a5f9", + "huggingface_downloads": "176bf621", "last_modified": "03590c01" }, - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" } diff --git a/packages/data/providers/stability/models/sd-vae-ft-mse.json b/packages/data/providers/stability/models/sd-vae-ft-mse.json index 40c7c0ecf..f32e81a85 100644 --- a/packages/data/providers/stability/models/sd-vae-ft-mse.json +++ b/packages/data/providers/stability/models/sd-vae-ft-mse.json @@ -11,7 +11,7 @@ "page_url": "https://huggingface.co/stabilityai/sd-vae-ft-mse", "open_weight": true, "tagline": "Sd Vae Ft Mse is a Stability AI model published on the official 
Stability AI Hugging Face organization.", - "huggingface_downloads": 102468, + "huggingface_downloads": 102400, "last_modified": "2023-06-06", "_generated": { "name": "ca2fd865", @@ -23,8 +23,8 @@ "page_url": "6abc04ea", "open_weight": "b326b506", "tagline": "d27bf42e", - "huggingface_downloads": "23276655", + "huggingface_downloads": "c0cae821", "last_modified": "f4c30a96" }, - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" } diff --git a/packages/data/providers/stability/models/sd-x2-latent-upscaler.json b/packages/data/providers/stability/models/sd-x2-latent-upscaler.json index 7e7e6b929..ab38dfef6 100644 --- a/packages/data/providers/stability/models/sd-x2-latent-upscaler.json +++ b/packages/data/providers/stability/models/sd-x2-latent-upscaler.json @@ -11,7 +11,7 @@ "page_url": "https://huggingface.co/stabilityai/sd-x2-latent-upscaler", "open_weight": true, "tagline": "Sd X2 Latent Upscaler is a Stability AI model published on the official Stability AI Hugging Face organization.", - "huggingface_downloads": 130271, + "huggingface_downloads": 129146, "last_modified": "2023-06-05", "_generated": { "name": "b710889b", @@ -23,8 +23,8 @@ "page_url": "458fd053", "open_weight": "b326b506", "tagline": "07563b02", - "huggingface_downloads": "d64f2ac9", + "huggingface_downloads": "505233af", "last_modified": "03590c01" }, - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" } diff --git a/packages/data/providers/stability/models/sdxl-turbo-tensorrt.json b/packages/data/providers/stability/models/sdxl-turbo-tensorrt.json index 30bf7c1d6..25c1c3c35 100644 --- a/packages/data/providers/stability/models/sdxl-turbo-tensorrt.json +++ b/packages/data/providers/stability/models/sdxl-turbo-tensorrt.json @@ -20,7 +20,7 @@ "output": ["image"] }, "endpoints": ["images"], - "huggingface_downloads": 29, + "huggingface_downloads": 30, "last_modified": "2025-10-20", "_generated": { "name": "68d1174d", @@ -35,8 +35,8 @@ "capabilities": "ea60b262", "modalities": 
"814867b9", "endpoints": "9a7c17cc", - "huggingface_downloads": "6ea9ab1b", + "huggingface_downloads": "34173cb3", "last_modified": "ba1efbec" }, - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" } diff --git a/packages/data/providers/stability/models/sdxl-turbo.json b/packages/data/providers/stability/models/sdxl-turbo.json index 09a3419ec..f87bd6872 100644 --- a/packages/data/providers/stability/models/sdxl-turbo.json +++ b/packages/data/providers/stability/models/sdxl-turbo.json @@ -20,7 +20,7 @@ "output": ["image"] }, "endpoints": ["images"], - "huggingface_downloads": 609582, + "huggingface_downloads": 597950, "last_modified": "2024-07-10", "_generated": { "name": "f087df7a", @@ -35,8 +35,8 @@ "capabilities": "ea60b262", "modalities": "814867b9", "endpoints": "9a7c17cc", - "huggingface_downloads": "5277e7fd", + "huggingface_downloads": "c352cd30", "last_modified": "2d84b9f9" }, - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" } diff --git a/packages/data/providers/stability/models/sdxl-vae.json b/packages/data/providers/stability/models/sdxl-vae.json index 9ebc6b23a..61dde3e08 100644 --- a/packages/data/providers/stability/models/sdxl-vae.json +++ b/packages/data/providers/stability/models/sdxl-vae.json @@ -11,7 +11,7 @@ "page_url": "https://huggingface.co/stabilityai/sdxl-vae", "open_weight": true, "tagline": "Sdxl Vae is a Stability AI model published on the official Stability AI Hugging Face organization.", - "huggingface_downloads": 263433, + "huggingface_downloads": 259409, "last_modified": "2023-08-04", "_generated": { "name": "61bd1f43", @@ -23,8 +23,8 @@ "page_url": "f1404dbb", "open_weight": "b326b506", "tagline": "e2452bea", - "huggingface_downloads": "fedfb824", + "huggingface_downloads": "33838f8f", "last_modified": "8839bf02" }, - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" } diff --git a/packages/data/providers/stability/models/sp4d.json b/packages/data/providers/stability/models/sp4d.json index 
340a51e92..ceb9dbb42 100644 --- a/packages/data/providers/stability/models/sp4d.json +++ b/packages/data/providers/stability/models/sp4d.json @@ -11,7 +11,7 @@ "page_url": "https://huggingface.co/stabilityai/sp4d", "open_weight": true, "tagline": "Sp4d is a Stability AI model published on the official Stability AI Hugging Face organization.", - "huggingface_downloads": 15, + "huggingface_downloads": 12, "last_modified": "2025-11-05", "_generated": { "name": "457a0272", @@ -23,8 +23,8 @@ "page_url": "f1bc6a46", "open_weight": "b326b506", "tagline": "03685677", - "huggingface_downloads": "9bf31c7f", + "huggingface_downloads": "c20ad4d7", "last_modified": "6c2625ef" }, - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" } diff --git a/packages/data/providers/stability/models/stable-audio-3-medium-base.json b/packages/data/providers/stability/models/stable-audio-3-medium-base.json index d20e8175a..804bc2c01 100644 --- a/packages/data/providers/stability/models/stable-audio-3-medium-base.json +++ b/packages/data/providers/stability/models/stable-audio-3-medium-base.json @@ -11,7 +11,7 @@ "page_url": "https://huggingface.co/stabilityai/stable-audio-3-medium-base", "open_weight": true, "tagline": "Stable Audio 3 Medium Base is a Stability AI model published on the official Stability AI Hugging Face organization.", - "huggingface_downloads": 4312, + "huggingface_downloads": 4447, "last_modified": "2026-06-16", "_generated": { "name": "8bbce982", @@ -23,8 +23,8 @@ "page_url": "88125143", "open_weight": "b326b506", "tagline": "efd9b285", - "huggingface_downloads": "27d8d40b", + "huggingface_downloads": "6fd6b030", "last_modified": "3eed1aa6" }, - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" } diff --git a/packages/data/providers/stability/models/stable-audio-3-medium.json b/packages/data/providers/stability/models/stable-audio-3-medium.json index 4c622675c..8464ab249 100644 --- a/packages/data/providers/stability/models/stable-audio-3-medium.json +++ 
b/packages/data/providers/stability/models/stable-audio-3-medium.json @@ -11,7 +11,7 @@ "page_url": "https://huggingface.co/stabilityai/stable-audio-3-medium", "open_weight": true, "tagline": "Stable Audio 3 Medium is a Stability AI model published on the official Stability AI Hugging Face organization.", - "huggingface_downloads": 59946, + "huggingface_downloads": 57092, "last_modified": "2026-06-16", "_generated": { "name": "876218de", @@ -23,8 +23,8 @@ "page_url": "21ce02fa", "open_weight": "b326b506", "tagline": "1eed9084", - "huggingface_downloads": "880c0424", + "huggingface_downloads": "30ffe7c0", "last_modified": "3eed1aa6" }, - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" } diff --git a/packages/data/providers/stability/models/stable-audio-3-small-music-base.json b/packages/data/providers/stability/models/stable-audio-3-small-music-base.json index 76d124231..d1e63455a 100644 --- a/packages/data/providers/stability/models/stable-audio-3-small-music-base.json +++ b/packages/data/providers/stability/models/stable-audio-3-small-music-base.json @@ -11,7 +11,7 @@ "page_url": "https://huggingface.co/stabilityai/stable-audio-3-small-music-base", "open_weight": true, "tagline": "Stable Audio 3 Small Music Base is a Stability AI model published on the official Stability AI Hugging Face organization.", - "huggingface_downloads": 1769, + "huggingface_downloads": 1747, "last_modified": "2026-05-20", "_generated": { "name": "467580cd", @@ -23,8 +23,8 @@ "page_url": "c7772e44", "open_weight": "b326b506", "tagline": "50ceceff", - "huggingface_downloads": "7eb7eabb", + "huggingface_downloads": "3e15cc11", "last_modified": "7a81e6e3" }, - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" } diff --git a/packages/data/providers/stability/models/stable-audio-3-small-music.json b/packages/data/providers/stability/models/stable-audio-3-small-music.json index 2f887d16d..b77c77d4d 100644 --- 
a/packages/data/providers/stability/models/stable-audio-3-small-music.json +++ b/packages/data/providers/stability/models/stable-audio-3-small-music.json @@ -11,7 +11,7 @@ "page_url": "https://huggingface.co/stabilityai/stable-audio-3-small-music", "open_weight": true, "tagline": "Stable Audio 3 Small Music is a Stability AI model published on the official Stability AI Hugging Face organization.", - "huggingface_downloads": 15603, + "huggingface_downloads": 15375, "last_modified": "2026-05-19", "_generated": { "name": "f5e21a2b", @@ -23,8 +23,8 @@ "page_url": "2c770fc1", "open_weight": "b326b506", "tagline": "eb65778e", - "huggingface_downloads": "b39f604b", + "huggingface_downloads": "73926ad4", "last_modified": "665f01a0" }, - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" } diff --git a/packages/data/providers/stability/models/stable-audio-3-small-sfx-base.json b/packages/data/providers/stability/models/stable-audio-3-small-sfx-base.json index 7c5ca335e..722428286 100644 --- a/packages/data/providers/stability/models/stable-audio-3-small-sfx-base.json +++ b/packages/data/providers/stability/models/stable-audio-3-small-sfx-base.json @@ -11,7 +11,7 @@ "page_url": "https://huggingface.co/stabilityai/stable-audio-3-small-sfx-base", "open_weight": true, "tagline": "Stable Audio 3 Small Sfx Base is a Stability AI model published on the official Stability AI Hugging Face organization.", - "huggingface_downloads": 1054, + "huggingface_downloads": 1064, "last_modified": "2026-05-20", "_generated": { "name": "81a44e64", @@ -23,8 +23,8 @@ "page_url": "01e67b4a", "open_weight": "b326b506", "tagline": "ff9b4547", - "huggingface_downloads": "db576a7d", + "huggingface_downloads": "2290a738", "last_modified": "7a81e6e3" }, - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" } diff --git a/packages/data/providers/stability/models/stable-audio-3-small-sfx.json b/packages/data/providers/stability/models/stable-audio-3-small-sfx.json index 
48f22b624..66167fda3 100644 --- a/packages/data/providers/stability/models/stable-audio-3-small-sfx.json +++ b/packages/data/providers/stability/models/stable-audio-3-small-sfx.json @@ -11,7 +11,7 @@ "page_url": "https://huggingface.co/stabilityai/stable-audio-3-small-sfx", "open_weight": true, "tagline": "Stable Audio 3 Small Sfx is a Stability AI model published on the official Stability AI Hugging Face organization.", - "huggingface_downloads": 12006, + "huggingface_downloads": 12045, "last_modified": "2026-05-19", "_generated": { "name": "86c5e6d0", @@ -23,8 +23,8 @@ "page_url": "6a088c2a", "open_weight": "b326b506", "tagline": "801babc4", - "huggingface_downloads": "ef126722", + "huggingface_downloads": "fb598cb4", "last_modified": "665f01a0" }, - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" } diff --git a/packages/data/providers/stability/models/stable-audio-open-1.0.json b/packages/data/providers/stability/models/stable-audio-open-1.0.json index 6f466f745..bef259330 100644 --- a/packages/data/providers/stability/models/stable-audio-open-1.0.json +++ b/packages/data/providers/stability/models/stable-audio-open-1.0.json @@ -16,7 +16,7 @@ "fine_tuning": true }, "tools": ["function_calling"], - "huggingface_downloads": 26532, + "huggingface_downloads": 25989, "last_modified": "2025-06-19", "_generated": { "name": "ff7cb910", @@ -30,8 +30,8 @@ "tagline": "0822e325", "capabilities": "5de6a2be", "tools": "f0c1dc7e", - "huggingface_downloads": "83870fb9", + "huggingface_downloads": "834520f1", "last_modified": "dc9b2bc0" }, - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" } diff --git a/packages/data/providers/stability/models/stable-audio-open-small.json b/packages/data/providers/stability/models/stable-audio-open-small.json index 53388d37a..d43796f94 100644 --- a/packages/data/providers/stability/models/stable-audio-open-small.json +++ b/packages/data/providers/stability/models/stable-audio-open-small.json @@ -16,7 +16,7 @@ 
"fine_tuning": true }, "tools": ["function_calling"], - "huggingface_downloads": 2235, + "huggingface_downloads": 2169, "last_modified": "2025-05-27", "_generated": { "name": "cedaf559", @@ -30,8 +30,8 @@ "tagline": "8d9b7098", "capabilities": "5de6a2be", "tools": "f0c1dc7e", - "huggingface_downloads": "b0b79da5", + "huggingface_downloads": "bd0cc810", "last_modified": "2c4f5431" }, - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" } diff --git a/packages/data/providers/stability/models/stable-cascade-prior.json b/packages/data/providers/stability/models/stable-cascade-prior.json index 2f4f6e63e..b956f96e8 100644 --- a/packages/data/providers/stability/models/stable-cascade-prior.json +++ b/packages/data/providers/stability/models/stable-cascade-prior.json @@ -20,7 +20,7 @@ "output": ["image"] }, "endpoints": ["images"], - "huggingface_downloads": 789, + "huggingface_downloads": 796, "last_modified": "2024-03-14", "_generated": { "name": "f0c97102", @@ -35,8 +35,8 @@ "capabilities": "ea60b262", "modalities": "814867b9", "endpoints": "9a7c17cc", - "huggingface_downloads": "68053af2", + "huggingface_downloads": "35cf8659", "last_modified": "72223066" }, - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" } diff --git a/packages/data/providers/stability/models/stable-cascade.json b/packages/data/providers/stability/models/stable-cascade.json index fc4680cc9..1f02bb952 100644 --- a/packages/data/providers/stability/models/stable-cascade.json +++ b/packages/data/providers/stability/models/stable-cascade.json @@ -20,7 +20,7 @@ "output": ["image"] }, "endpoints": ["images"], - "huggingface_downloads": 8252, + "huggingface_downloads": 8407, "last_modified": "2024-03-16", "_generated": { "name": "e3c7218e", @@ -35,8 +35,8 @@ "capabilities": "ea60b262", "modalities": "814867b9", "endpoints": "9a7c17cc", - "huggingface_downloads": "88b05733", + "huggingface_downloads": "5112277e", "last_modified": "ab6420da" }, - "last_updated": "2026-06-29" + 
"last_updated": "2026-06-30" } diff --git a/packages/data/providers/stability/models/stable-code-3b.json b/packages/data/providers/stability/models/stable-code-3b.json index 7213bdd9d..dbe6d4c0b 100644 --- a/packages/data/providers/stability/models/stable-code-3b.json +++ b/packages/data/providers/stability/models/stable-code-3b.json @@ -21,7 +21,7 @@ "output": ["text"] }, "endpoints": ["chat_completions"], - "huggingface_downloads": 5918, + "huggingface_downloads": 5825, "last_modified": "2024-07-10", "_generated": { "name": "72288c95", @@ -37,8 +37,8 @@ "capabilities": "9c665f5d", "modalities": "68e53d93", "endpoints": "d8fa1080", - "huggingface_downloads": "15ae3b9d", + "huggingface_downloads": "c5a0ac0e", "last_modified": "2d84b9f9" }, - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" } diff --git a/packages/data/providers/stability/models/stable-code-instruct-3b.json b/packages/data/providers/stability/models/stable-code-instruct-3b.json index f3337dde1..d34550693 100644 --- a/packages/data/providers/stability/models/stable-code-instruct-3b.json +++ b/packages/data/providers/stability/models/stable-code-instruct-3b.json @@ -21,7 +21,7 @@ "output": ["text"] }, "endpoints": ["chat_completions"], - "huggingface_downloads": 2335, + "huggingface_downloads": 2318, "last_modified": "2024-07-10", "_generated": { "name": "e3b8e511", @@ -37,8 +37,8 @@ "capabilities": "9c665f5d", "modalities": "68e53d93", "endpoints": "d8fa1080", - "huggingface_downloads": "7b4773c0", + "huggingface_downloads": "426f990b", "last_modified": "2d84b9f9" }, - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" } diff --git a/packages/data/providers/stability/models/stable-diffusion-3-medium-amdnpu.json b/packages/data/providers/stability/models/stable-diffusion-3-medium-amdnpu.json index c7dcadf04..3886f07cf 100644 --- a/packages/data/providers/stability/models/stable-diffusion-3-medium-amdnpu.json +++ 
b/packages/data/providers/stability/models/stable-diffusion-3-medium-amdnpu.json @@ -20,7 +20,7 @@ "output": ["image"] }, "endpoints": ["images"], - "huggingface_downloads": 27, + "huggingface_downloads": 31, "last_modified": "2026-05-05", "_generated": { "name": "64ed1575", @@ -35,8 +35,8 @@ "capabilities": "ea60b262", "modalities": "814867b9", "endpoints": "9a7c17cc", - "huggingface_downloads": "02e74f10", + "huggingface_downloads": "c16a5320", "last_modified": "ab530d19" }, - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" } diff --git a/packages/data/providers/stability/models/stable-diffusion-3-medium-diffusers.json b/packages/data/providers/stability/models/stable-diffusion-3-medium-diffusers.json index 834b55bbb..0cd924a84 100644 --- a/packages/data/providers/stability/models/stable-diffusion-3-medium-diffusers.json +++ b/packages/data/providers/stability/models/stable-diffusion-3-medium-diffusers.json @@ -20,7 +20,7 @@ "output": ["image"] }, "endpoints": ["images"], - "huggingface_downloads": 33289, + "huggingface_downloads": 32528, "last_modified": "2024-06-19", "_generated": { "name": "78aabedd", @@ -35,8 +35,8 @@ "capabilities": "ea60b262", "modalities": "814867b9", "endpoints": "9a7c17cc", - "huggingface_downloads": "6cdc8dc1", + "huggingface_downloads": "91c54670", "last_modified": "15de15c0" }, - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" } diff --git a/packages/data/providers/stability/models/stable-diffusion-3-medium.json b/packages/data/providers/stability/models/stable-diffusion-3-medium.json index 20e984bae..ca77aa6c3 100644 --- a/packages/data/providers/stability/models/stable-diffusion-3-medium.json +++ b/packages/data/providers/stability/models/stable-diffusion-3-medium.json @@ -20,7 +20,7 @@ "output": ["image"] }, "endpoints": ["images"], - "huggingface_downloads": 3481, + "huggingface_downloads": 3491, "last_modified": "2024-08-12", "_generated": { "name": "eafb868d", @@ -35,8 +35,8 @@ "capabilities": "ea60b262", 
"modalities": "814867b9", "endpoints": "9a7c17cc", - "huggingface_downloads": "3fb04953", + "huggingface_downloads": "6c91724b", "last_modified": "946d44f9" }, - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" } diff --git a/packages/data/providers/stability/models/stable-diffusion-3.5-large-tensorrt.json b/packages/data/providers/stability/models/stable-diffusion-3.5-large-tensorrt.json index b399a7e8d..ad5057c46 100644 --- a/packages/data/providers/stability/models/stable-diffusion-3.5-large-tensorrt.json +++ b/packages/data/providers/stability/models/stable-diffusion-3.5-large-tensorrt.json @@ -20,7 +20,7 @@ "output": ["image"] }, "endpoints": ["images"], - "huggingface_downloads": 1469, + "huggingface_downloads": 1483, "last_modified": "2025-10-20", "_generated": { "name": "c716fe33", @@ -35,8 +35,8 @@ "capabilities": "ea60b262", "modalities": "814867b9", "endpoints": "9a7c17cc", - "huggingface_downloads": "991de292", + "huggingface_downloads": "bffc9834", "last_modified": "ba1efbec" }, - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" } diff --git a/packages/data/providers/stability/models/stable-diffusion-3.5-medium-tensorrt.json b/packages/data/providers/stability/models/stable-diffusion-3.5-medium-tensorrt.json index 2156eb442..99cda3890 100644 --- a/packages/data/providers/stability/models/stable-diffusion-3.5-medium-tensorrt.json +++ b/packages/data/providers/stability/models/stable-diffusion-3.5-medium-tensorrt.json @@ -20,7 +20,7 @@ "output": ["image"] }, "endpoints": ["images"], - "huggingface_downloads": 9, + "huggingface_downloads": 12, "last_modified": "2025-10-20", "_generated": { "name": "5ff1dfdb", @@ -35,8 +35,8 @@ "capabilities": "ea60b262", "modalities": "814867b9", "endpoints": "9a7c17cc", - "huggingface_downloads": "45c48cce", + "huggingface_downloads": "c20ad4d7", "last_modified": "ba1efbec" }, - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" } diff --git 
a/packages/data/providers/stability/models/stable-diffusion-x4-upscaler.json b/packages/data/providers/stability/models/stable-diffusion-x4-upscaler.json index 81571bb4f..f5155c8d7 100644 --- a/packages/data/providers/stability/models/stable-diffusion-x4-upscaler.json +++ b/packages/data/providers/stability/models/stable-diffusion-x4-upscaler.json @@ -11,7 +11,7 @@ "page_url": "https://huggingface.co/stabilityai/stable-diffusion-x4-upscaler", "open_weight": true, "tagline": "Stable Diffusion X4 Upscaler is a Stability AI model published on the official Stability AI Hugging Face organization.", - "huggingface_downloads": 10328, + "huggingface_downloads": 10040, "last_modified": "2023-07-05", "_generated": { "name": "a20c3000", @@ -23,8 +23,8 @@ "page_url": "fc4767fe", "open_weight": "b326b506", "tagline": "7dcec512", - "huggingface_downloads": "e6b738ec", + "huggingface_downloads": "f250daff", "last_modified": "3e5171a5" }, - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" } diff --git a/packages/data/providers/stability/models/stable-diffusion-xl-1.0-tensorrt.json b/packages/data/providers/stability/models/stable-diffusion-xl-1.0-tensorrt.json index dd1f131c4..57f6a1bb2 100644 --- a/packages/data/providers/stability/models/stable-diffusion-xl-1.0-tensorrt.json +++ b/packages/data/providers/stability/models/stable-diffusion-xl-1.0-tensorrt.json @@ -20,7 +20,7 @@ "output": ["image"] }, "endpoints": ["images"], - "huggingface_downloads": 275, + "huggingface_downloads": 276, "last_modified": "2025-10-20", "_generated": { "name": "947e9976", @@ -35,8 +35,8 @@ "capabilities": "ea60b262", "modalities": "814867b9", "endpoints": "9a7c17cc", - "huggingface_downloads": "63923f49", + "huggingface_downloads": "db8e1af0", "last_modified": "ba1efbec" }, - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" } diff --git a/packages/data/providers/stability/models/stable-diffusion-xl-base-0.9.json 
b/packages/data/providers/stability/models/stable-diffusion-xl-base-0.9.json index 6da8b8d76..d8ab23eb5 100644 --- a/packages/data/providers/stability/models/stable-diffusion-xl-base-0.9.json +++ b/packages/data/providers/stability/models/stable-diffusion-xl-base-0.9.json @@ -20,7 +20,7 @@ "output": ["image"] }, "endpoints": ["images"], - "huggingface_downloads": 48, + "huggingface_downloads": 51, "last_modified": "2023-07-12", "_generated": { "name": "0e45d5d2", @@ -35,8 +35,8 @@ "capabilities": "ea60b262", "modalities": "814867b9", "endpoints": "9a7c17cc", - "huggingface_downloads": "642e92ef", + "huggingface_downloads": "2838023a", "last_modified": "10fafc2e" }, - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" } diff --git a/packages/data/providers/stability/models/stable-diffusion-xl-base-1.0.json b/packages/data/providers/stability/models/stable-diffusion-xl-base-1.0.json index 0c4078074..418f8eb25 100644 --- a/packages/data/providers/stability/models/stable-diffusion-xl-base-1.0.json +++ b/packages/data/providers/stability/models/stable-diffusion-xl-base-1.0.json @@ -20,7 +20,7 @@ "output": ["image"] }, "endpoints": ["images"], - "huggingface_downloads": 1324082, + "huggingface_downloads": 1323188, "last_modified": "2023-10-30", "_generated": { "name": "39a40ead", @@ -35,8 +35,8 @@ "capabilities": "ea60b262", "modalities": "814867b9", "endpoints": "9a7c17cc", - "huggingface_downloads": "2836cbc4", + "huggingface_downloads": "21396a2b", "last_modified": "ca1bf8a0" }, - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" } diff --git a/packages/data/providers/stability/models/stable-diffusion-xl-refiner-0.9.json b/packages/data/providers/stability/models/stable-diffusion-xl-refiner-0.9.json index fa79f3f88..218732a75 100644 --- a/packages/data/providers/stability/models/stable-diffusion-xl-refiner-0.9.json +++ b/packages/data/providers/stability/models/stable-diffusion-xl-refiner-0.9.json @@ -20,7 +20,7 @@ "output": ["image"] }, 
"endpoints": ["images"], - "huggingface_downloads": 45, + "huggingface_downloads": 48, "last_modified": "2023-07-12", "_generated": { "name": "12134189", @@ -35,8 +35,8 @@ "capabilities": "ea60b262", "modalities": "bbf9b8bb", "endpoints": "9a7c17cc", - "huggingface_downloads": "6c8349cc", + "huggingface_downloads": "642e92ef", "last_modified": "10fafc2e" }, - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" } diff --git a/packages/data/providers/stability/models/stable-diffusion-xl-refiner-1.0.json b/packages/data/providers/stability/models/stable-diffusion-xl-refiner-1.0.json index 6e49f7b2d..258a3cf13 100644 --- a/packages/data/providers/stability/models/stable-diffusion-xl-refiner-1.0.json +++ b/packages/data/providers/stability/models/stable-diffusion-xl-refiner-1.0.json @@ -20,7 +20,7 @@ "output": ["image"] }, "endpoints": ["images"], - "huggingface_downloads": 163793, + "huggingface_downloads": 161798, "last_modified": "2023-09-25", "_generated": { "name": "abfa186d", @@ -35,8 +35,8 @@ "capabilities": "ea60b262", "modalities": "bbf9b8bb", "endpoints": "9a7c17cc", - "huggingface_downloads": "6d8c3fab", + "huggingface_downloads": "ada4ae0c", "last_modified": "c97eddf5" }, - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" } diff --git a/packages/data/providers/stability/models/stable-fast-3d.json b/packages/data/providers/stability/models/stable-fast-3d.json index afd3765ab..63761d07f 100644 --- a/packages/data/providers/stability/models/stable-fast-3d.json +++ b/packages/data/providers/stability/models/stable-fast-3d.json @@ -15,7 +15,7 @@ "vision": true, "fine_tuning": true }, - "huggingface_downloads": 11960, + "huggingface_downloads": 11721, "last_modified": "2025-04-08", "_generated": { "name": "0fab393a", @@ -28,8 +28,8 @@ "open_weight": "b326b506", "tagline": "5f201e26", "capabilities": "ea60b262", - "huggingface_downloads": "deb18dd9", + "huggingface_downloads": "2b2e7393", "last_modified": "69fc7fbd" }, - "last_updated": 
"2026-06-29" + "last_updated": "2026-06-30" } diff --git a/packages/data/providers/stability/models/stable-video-diffusion-img2vid-xt-1-1.json b/packages/data/providers/stability/models/stable-video-diffusion-img2vid-xt-1-1.json index f50fcb68c..d50c5ba22 100644 --- a/packages/data/providers/stability/models/stable-video-diffusion-img2vid-xt-1-1.json +++ b/packages/data/providers/stability/models/stable-video-diffusion-img2vid-xt-1-1.json @@ -20,7 +20,7 @@ "output": ["video"] }, "endpoints": ["video"], - "huggingface_downloads": 7772, + "huggingface_downloads": 7755, "last_modified": "2024-07-10", "_generated": { "name": "56b3650f", @@ -35,8 +35,8 @@ "capabilities": "ea60b262", "modalities": "85fd0565", "endpoints": "7a78c070", - "huggingface_downloads": "36e51f22", + "huggingface_downloads": "10493aa8", "last_modified": "2d84b9f9" }, - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" } diff --git a/packages/data/providers/stability/models/stable-video-diffusion-img2vid-xt.json b/packages/data/providers/stability/models/stable-video-diffusion-img2vid-xt.json index c90b2bfcb..7b3297853 100644 --- a/packages/data/providers/stability/models/stable-video-diffusion-img2vid-xt.json +++ b/packages/data/providers/stability/models/stable-video-diffusion-img2vid-xt.json @@ -20,7 +20,7 @@ "output": ["video"] }, "endpoints": ["video"], - "huggingface_downloads": 218304, + "huggingface_downloads": 216367, "last_modified": "2024-07-10", "_generated": { "name": "e905da6a", @@ -35,8 +35,8 @@ "capabilities": "ea60b262", "modalities": "85fd0565", "endpoints": "7a78c070", - "huggingface_downloads": "22df33a0", + "huggingface_downloads": "05d393e9", "last_modified": "2d84b9f9" }, - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" } diff --git a/packages/data/providers/stability/models/stable-video-diffusion-img2vid.json b/packages/data/providers/stability/models/stable-video-diffusion-img2vid.json index e0d37c980..eead3743f 100644 --- 
a/packages/data/providers/stability/models/stable-video-diffusion-img2vid.json +++ b/packages/data/providers/stability/models/stable-video-diffusion-img2vid.json @@ -20,7 +20,7 @@ "output": ["video"] }, "endpoints": ["video"], - "huggingface_downloads": 32007, + "huggingface_downloads": 31140, "last_modified": "2024-07-10", "_generated": { "name": "f434ca86", @@ -35,8 +35,8 @@ "capabilities": "ea60b262", "modalities": "85fd0565", "endpoints": "7a78c070", - "huggingface_downloads": "36013621", + "huggingface_downloads": "82b31198", "last_modified": "2d84b9f9" }, - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" } diff --git a/packages/data/providers/stability/models/stablebeluga-13b.json b/packages/data/providers/stability/models/stablebeluga-13b.json index 981cd8967..783dd3771 100644 --- a/packages/data/providers/stability/models/stablebeluga-13b.json +++ b/packages/data/providers/stability/models/stablebeluga-13b.json @@ -19,7 +19,7 @@ "output": ["text"] }, "endpoints": ["chat_completions"], - "huggingface_downloads": 260, + "huggingface_downloads": 257, "last_modified": "2023-08-29", "_generated": { "name": "ebdd4163", @@ -34,8 +34,8 @@ "capabilities": "0fa77dc6", "modalities": "68e53d93", "endpoints": "d8fa1080", - "huggingface_downloads": "a4f23670", + "huggingface_downloads": "d96409bf", "last_modified": "cf47b6d1" }, - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" } diff --git a/packages/data/providers/stability/models/stablebeluga-7b.json b/packages/data/providers/stability/models/stablebeluga-7b.json index e1ab2b25f..afb10158e 100644 --- a/packages/data/providers/stability/models/stablebeluga-7b.json +++ b/packages/data/providers/stability/models/stablebeluga-7b.json @@ -19,7 +19,7 @@ "output": ["text"] }, "endpoints": ["chat_completions"], - "huggingface_downloads": 251, + "huggingface_downloads": 248, "last_modified": "2023-08-29", "_generated": { "name": "c568803e", @@ -34,8 +34,8 @@ "capabilities": "0fa77dc6", "modalities": 
"68e53d93", "endpoints": "d8fa1080", - "huggingface_downloads": "19f3cd30", + "huggingface_downloads": "621bf66d", "last_modified": "cf47b6d1" }, - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" } diff --git a/packages/data/providers/stability/models/stablebeluga2.json b/packages/data/providers/stability/models/stablebeluga2.json index b75b95be9..23c293b3d 100644 --- a/packages/data/providers/stability/models/stablebeluga2.json +++ b/packages/data/providers/stability/models/stablebeluga2.json @@ -18,7 +18,7 @@ "output": ["text"] }, "endpoints": ["chat_completions"], - "huggingface_downloads": 717, + "huggingface_downloads": 761, "last_modified": "2023-09-18", "_generated": { "name": "ba958057", @@ -32,8 +32,8 @@ "capabilities": "0fa77dc6", "modalities": "68e53d93", "endpoints": "d8fa1080", - "huggingface_downloads": "788d9869", + "huggingface_downloads": "88ae6372", "last_modified": "c9747a7f" }, - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" } diff --git a/packages/data/providers/stability/models/stablecode-completion-alpha-3b-4k.json b/packages/data/providers/stability/models/stablecode-completion-alpha-3b-4k.json index c8ba93591..e8279f7a9 100644 --- a/packages/data/providers/stability/models/stablecode-completion-alpha-3b-4k.json +++ b/packages/data/providers/stability/models/stablecode-completion-alpha-3b-4k.json @@ -21,7 +21,7 @@ "output": ["text"] }, "endpoints": ["chat_completions"], - "huggingface_downloads": 1115, + "huggingface_downloads": 1092, "last_modified": "2023-08-08", "_generated": { "name": "0abfb02c", @@ -37,8 +37,8 @@ "capabilities": "9c665f5d", "modalities": "68e53d93", "endpoints": "d8fa1080", - "huggingface_downloads": "e19347e1", + "huggingface_downloads": "6a2feef8", "last_modified": "a4b79bfa" }, - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" } diff --git a/packages/data/providers/stability/models/stablecode-completion-alpha-3b.json 
b/packages/data/providers/stability/models/stablecode-completion-alpha-3b.json index 6a16a391e..31bf1c357 100644 --- a/packages/data/providers/stability/models/stablecode-completion-alpha-3b.json +++ b/packages/data/providers/stability/models/stablecode-completion-alpha-3b.json @@ -21,7 +21,7 @@ "output": ["text"] }, "endpoints": ["chat_completions"], - "huggingface_downloads": 408, + "huggingface_downloads": 385, "last_modified": "2023-08-08", "_generated": { "name": "046e9a2f", @@ -37,8 +37,8 @@ "capabilities": "9c665f5d", "modalities": "68e53d93", "endpoints": "d8fa1080", - "huggingface_downloads": "0d0fd7c6", + "huggingface_downloads": "dc912a25", "last_modified": "a4b79bfa" }, - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" } diff --git a/packages/data/providers/stability/models/stablelm-2-12b-chat-gguf.json b/packages/data/providers/stability/models/stablelm-2-12b-chat-gguf.json index 2bc9f0b59..61003f021 100644 --- a/packages/data/providers/stability/models/stablelm-2-12b-chat-gguf.json +++ b/packages/data/providers/stability/models/stablelm-2-12b-chat-gguf.json @@ -23,7 +23,7 @@ }, "endpoints": ["chat_completions"], "tools": ["function_calling"], - "huggingface_downloads": 168, + "huggingface_downloads": 176, "last_modified": "2024-04-20", "_generated": { "name": "02178e15", @@ -40,8 +40,8 @@ "modalities": "68e53d93", "endpoints": "d8fa1080", "tools": "f0c1dc7e", - "huggingface_downloads": "006f52e9", + "huggingface_downloads": "38af8613", "last_modified": "fd79eb8a" }, - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" } diff --git a/packages/data/providers/stability/models/stablelm-2-12b-chat.json b/packages/data/providers/stability/models/stablelm-2-12b-chat.json index 180018291..387bc7a0e 100644 --- a/packages/data/providers/stability/models/stablelm-2-12b-chat.json +++ b/packages/data/providers/stability/models/stablelm-2-12b-chat.json @@ -23,7 +23,7 @@ }, "endpoints": ["chat_completions"], "tools": ["function_calling"], - 
"huggingface_downloads": 266, + "huggingface_downloads": 260, "last_modified": "2024-05-20", "_generated": { "name": "f68e2426", @@ -40,8 +40,8 @@ "modalities": "68e53d93", "endpoints": "d8fa1080", "tools": "f0c1dc7e", - "huggingface_downloads": "f7664060", + "huggingface_downloads": "a4f23670", "last_modified": "fc4e65a1" }, - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" } diff --git a/packages/data/providers/stability/models/stablelm-2-12b.json b/packages/data/providers/stability/models/stablelm-2-12b.json index 931364e97..014e63ec2 100644 --- a/packages/data/providers/stability/models/stablelm-2-12b.json +++ b/packages/data/providers/stability/models/stablelm-2-12b.json @@ -21,7 +21,7 @@ "output": ["text"] }, "endpoints": ["chat_completions"], - "huggingface_downloads": 3144, + "huggingface_downloads": 3321, "last_modified": "2024-07-10", "_generated": { "name": "904c9bd9", @@ -37,8 +37,8 @@ "capabilities": "9c665f5d", "modalities": "68e53d93", "endpoints": "d8fa1080", - "huggingface_downloads": "a41b3bb3", + "huggingface_downloads": "3cfbdf46", "last_modified": "2d84b9f9" }, - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" } diff --git a/packages/data/providers/stability/models/stablelm-2-1_6b-chat.json b/packages/data/providers/stability/models/stablelm-2-1_6b-chat.json index 682ab6ce2..07b8fe9f5 100644 --- a/packages/data/providers/stability/models/stablelm-2-1_6b-chat.json +++ b/packages/data/providers/stability/models/stablelm-2-1_6b-chat.json @@ -21,7 +21,7 @@ "output": ["text"] }, "endpoints": ["chat_completions"], - "huggingface_downloads": 843, + "huggingface_downloads": 867, "last_modified": "2024-06-03", "_generated": { "name": "77a80ba4", @@ -37,8 +37,8 @@ "capabilities": "9c665f5d", "modalities": "68e53d93", "endpoints": "d8fa1080", - "huggingface_downloads": "3d8e28ca", + "huggingface_downloads": "ede7e2b6", "last_modified": "90065f25" }, - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" } diff --git 
a/packages/data/providers/stability/models/stablelm-2-1_6b.json b/packages/data/providers/stability/models/stablelm-2-1_6b.json index 812059d09..a211514b4 100644 --- a/packages/data/providers/stability/models/stablelm-2-1_6b.json +++ b/packages/data/providers/stability/models/stablelm-2-1_6b.json @@ -21,7 +21,7 @@ "output": ["text"] }, "endpoints": ["chat_completions"], - "huggingface_downloads": 10285, + "huggingface_downloads": 10913, "last_modified": "2024-07-10", "_generated": { "name": "225475de", @@ -37,8 +37,8 @@ "capabilities": "9c665f5d", "modalities": "68e53d93", "endpoints": "d8fa1080", - "huggingface_downloads": "7e89a835", + "huggingface_downloads": "7a3189dc", "last_modified": "2d84b9f9" }, - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" } diff --git a/packages/data/providers/stability/models/stablelm-2-zephyr-1_6b.json b/packages/data/providers/stability/models/stablelm-2-zephyr-1_6b.json index 36653be03..3a3b81838 100644 --- a/packages/data/providers/stability/models/stablelm-2-zephyr-1_6b.json +++ b/packages/data/providers/stability/models/stablelm-2-zephyr-1_6b.json @@ -21,7 +21,7 @@ "output": ["text"] }, "endpoints": ["chat_completions"], - "huggingface_downloads": 3318, + "huggingface_downloads": 3299, "last_modified": "2024-06-03", "_generated": { "name": "66b2c37d", @@ -37,8 +37,8 @@ "capabilities": "9c665f5d", "modalities": "68e53d93", "endpoints": "d8fa1080", - "huggingface_downloads": "831b1ac5", + "huggingface_downloads": "7371364b", "last_modified": "90065f25" }, - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" } diff --git a/packages/data/providers/stability/models/stablelm-3b-4e1t.json b/packages/data/providers/stability/models/stablelm-3b-4e1t.json index adc91146c..a1c4dc190 100644 --- a/packages/data/providers/stability/models/stablelm-3b-4e1t.json +++ b/packages/data/providers/stability/models/stablelm-3b-4e1t.json @@ -21,7 +21,7 @@ "output": ["text"] }, "endpoints": ["chat_completions"], - 
"huggingface_downloads": 93520, + "huggingface_downloads": 93032, "last_modified": "2024-03-07", "_generated": { "name": "66026194", @@ -37,8 +37,8 @@ "capabilities": "9c665f5d", "modalities": "68e53d93", "endpoints": "d8fa1080", - "huggingface_downloads": "ac78b098", + "huggingface_downloads": "a42b7cdd", "last_modified": "b151d9b5" }, - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" } diff --git a/packages/data/providers/stability/models/stablelm-base-alpha-3b-v2.json b/packages/data/providers/stability/models/stablelm-base-alpha-3b-v2.json index d43e31da0..eb4307efb 100644 --- a/packages/data/providers/stability/models/stablelm-base-alpha-3b-v2.json +++ b/packages/data/providers/stability/models/stablelm-base-alpha-3b-v2.json @@ -21,7 +21,7 @@ "output": ["text"] }, "endpoints": ["chat_completions"], - "huggingface_downloads": 531, + "huggingface_downloads": 528, "last_modified": "2023-09-11", "_generated": { "name": "0dca166d", @@ -37,8 +37,8 @@ "capabilities": "9c665f5d", "modalities": "68e53d93", "endpoints": "d8fa1080", - "huggingface_downloads": "0fcbc61a", + "huggingface_downloads": "f4be0027", "last_modified": "aa23e1b4" }, - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" } diff --git a/packages/data/providers/stability/models/stablelm-base-alpha-3b.json b/packages/data/providers/stability/models/stablelm-base-alpha-3b.json index d243410f0..d29c5748a 100644 --- a/packages/data/providers/stability/models/stablelm-base-alpha-3b.json +++ b/packages/data/providers/stability/models/stablelm-base-alpha-3b.json @@ -21,7 +21,7 @@ "output": ["text"] }, "endpoints": ["chat_completions"], - "huggingface_downloads": 3011, + "huggingface_downloads": 2984, "last_modified": "2023-10-19", "_generated": { "name": "187d0d83", @@ -37,8 +37,8 @@ "capabilities": "9c665f5d", "modalities": "68e53d93", "endpoints": "d8fa1080", - "huggingface_downloads": "b1f62fa9", + "huggingface_downloads": "1c67df9e", "last_modified": "5e832b78" }, - "last_updated": 
"2026-06-29" + "last_updated": "2026-06-30" } diff --git a/packages/data/providers/stability/models/stablelm-base-alpha-7b.json b/packages/data/providers/stability/models/stablelm-base-alpha-7b.json index ab1376357..df6d9a6e3 100644 --- a/packages/data/providers/stability/models/stablelm-base-alpha-7b.json +++ b/packages/data/providers/stability/models/stablelm-base-alpha-7b.json @@ -21,7 +21,7 @@ "output": ["text"] }, "endpoints": ["chat_completions"], - "huggingface_downloads": 999, + "huggingface_downloads": 974, "last_modified": "2023-10-19", "_generated": { "name": "aa206b67", @@ -37,8 +37,8 @@ "capabilities": "9c665f5d", "modalities": "68e53d93", "endpoints": "d8fa1080", - "huggingface_downloads": "b706835d", + "huggingface_downloads": "4311359e", "last_modified": "5e832b78" }, - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" } diff --git a/packages/data/providers/stability/models/stablelm-tuned-alpha-3b.json b/packages/data/providers/stability/models/stablelm-tuned-alpha-3b.json index 2fe56e8ee..fbb1de68f 100644 --- a/packages/data/providers/stability/models/stablelm-tuned-alpha-3b.json +++ b/packages/data/providers/stability/models/stablelm-tuned-alpha-3b.json @@ -21,7 +21,7 @@ "output": ["text"] }, "endpoints": ["chat_completions"], - "huggingface_downloads": 845, + "huggingface_downloads": 819, "last_modified": "2023-04-19", "_generated": { "name": "ff58b73f", @@ -37,8 +37,8 @@ "capabilities": "9c665f5d", "modalities": "68e53d93", "endpoints": "d8fa1080", - "huggingface_downloads": "b86e8d03", + "huggingface_downloads": "3b5dca50", "last_modified": "1ea09bfe" }, - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" } diff --git a/packages/data/providers/stability/models/stablelm-tuned-alpha-7b.json b/packages/data/providers/stability/models/stablelm-tuned-alpha-7b.json index 01c99056b..3de6d2801 100644 --- a/packages/data/providers/stability/models/stablelm-tuned-alpha-7b.json +++ 
b/packages/data/providers/stability/models/stablelm-tuned-alpha-7b.json @@ -21,7 +21,7 @@ "output": ["text"] }, "endpoints": ["chat_completions"], - "huggingface_downloads": 5838, + "huggingface_downloads": 5821, "last_modified": "2023-04-19", "_generated": { "name": "d4bd2c80", @@ -37,8 +37,8 @@ "capabilities": "9c665f5d", "modalities": "68e53d93", "endpoints": "d8fa1080", - "huggingface_downloads": "a91bc76c", + "huggingface_downloads": "926c11cc", "last_modified": "1ea09bfe" }, - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" } diff --git a/packages/data/providers/stability/models/stablelm-zephyr-3b.json b/packages/data/providers/stability/models/stablelm-zephyr-3b.json index eb1d0fefb..772897add 100644 --- a/packages/data/providers/stability/models/stablelm-zephyr-3b.json +++ b/packages/data/providers/stability/models/stablelm-zephyr-3b.json @@ -21,7 +21,7 @@ "output": ["text"] }, "endpoints": ["chat_completions"], - "huggingface_downloads": 28453, + "huggingface_downloads": 28462, "last_modified": "2024-07-10", "_generated": { "name": "7d629ed3", @@ -37,8 +37,8 @@ "capabilities": "9c665f5d", "modalities": "68e53d93", "endpoints": "d8fa1080", - "huggingface_downloads": "8e9f2243", + "huggingface_downloads": "001d908c", "last_modified": "2d84b9f9" }, - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" } diff --git a/packages/data/providers/stability/models/tiny-random-stablelm-2.json b/packages/data/providers/stability/models/tiny-random-stablelm-2.json index a93c31b1f..70638dada 100644 --- a/packages/data/providers/stability/models/tiny-random-stablelm-2.json +++ b/packages/data/providers/stability/models/tiny-random-stablelm-2.json @@ -18,7 +18,7 @@ "output": ["text"] }, "endpoints": ["chat_completions"], - "huggingface_downloads": 1405, + "huggingface_downloads": 1395, "last_modified": "2024-03-31", "_generated": { "name": "02988bf9", @@ -32,8 +32,8 @@ "capabilities": "0fa77dc6", "modalities": "68e53d93", "endpoints": "d8fa1080", - 
"huggingface_downloads": "3de2334a", + "huggingface_downloads": "14d9e800", "last_modified": "0ca5d11e" }, - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" } diff --git a/packages/data/providers/stability/models/triposr.json b/packages/data/providers/stability/models/triposr.json index d6cfb59cb..996d2f469 100644 --- a/packages/data/providers/stability/models/triposr.json +++ b/packages/data/providers/stability/models/triposr.json @@ -15,7 +15,7 @@ "vision": true, "fine_tuning": true }, - "huggingface_downloads": 189582, + "huggingface_downloads": 188532, "last_modified": "2024-08-09", "_generated": { "name": "deff3bf3", @@ -28,8 +28,8 @@ "open_weight": "b326b506", "tagline": "b8cff5fe", "capabilities": "ea60b262", - "huggingface_downloads": "03868a28", + "huggingface_downloads": "d2733e7b", "last_modified": "880765cb" }, - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" } diff --git a/packages/data/providers/vertex/models/veo-2.0-generate-001.json b/packages/data/providers/vertex/models/veo-2.0-generate-001.json index 51631de9a..0a3d3fa17 100644 --- a/packages/data/providers/vertex/models/veo-2.0-generate-001.json +++ b/packages/data/providers/vertex/models/veo-2.0-generate-001.json @@ -3,8 +3,8 @@ "name": "veo-2.0-generate-001", "created_by": "google", "source": "official", - "last_updated": "2026-06-29", - "status": "active", + "last_updated": "2026-06-30", + "status": "deprecated", "model_type": "video", "capabilities": { "streaming": true, @@ -23,7 +23,7 @@ "endpoints": ["generateContent", "streamGenerateContent"], "_generated": { "name": "89076b1f", - "status": "379ac110", + "status": "2e2f74dc", "model_type": "4d1b75ca", "capabilities": "fdff467b", "modalities": "85fd0565", @@ -33,11 +33,19 @@ "license": "9186c466", "open_weight": "68934a3e", "description": "a07bf735", - "tagline": "b16f53f3" + "tagline": "b16f53f3", + "deprecation_date": "ebf8cb32", + "successor": "712c232f" }, "family": "veo-2.0", "license": "proprietary", 
"open_weight": false, "description": "The Interactions API is now generally available. We recommend using this API for access to all the latest features and models. Home Gemini API Docs Send feedback Veo 2.0 This model is deprecated and will be shut down on **June 30, 2026**; migrate to Veo 3.1 Preview or the GA models available through the Gemini Enterprise Agent Platform to avoid service interruptions. Our robust and reliable stable video generation model, providing consistent performance for production-ready workflows. Veo 2.0 is best for standard 1080p content creation, social media assets, and high-volume video tasks that prioritize reliable character consistency and predictable sub-second generation speeds.", - "tagline": "Our robust and reliable stable video generation model, providing consistent performance for production-ready workflows." + "tagline": "Our robust and reliable stable video generation model, providing consistent performance for production-ready workflows.", + "deprecation_date": "2026-06-30", + "successor": [ + "veo-3.1-generate-preview", + "the GA models on the Gemini Enterprise Agent Platf", + "m" + ] } diff --git a/packages/data/providers/vertex/models/veo-3.0-fast-generate-001.json b/packages/data/providers/vertex/models/veo-3.0-fast-generate-001.json index dd79971e3..b1688de5d 100644 --- a/packages/data/providers/vertex/models/veo-3.0-fast-generate-001.json +++ b/packages/data/providers/vertex/models/veo-3.0-fast-generate-001.json @@ -4,7 +4,7 @@ "created_by": "google", "source": "official", "family": "veo-3.0", - "status": "active", + "status": "deprecated", "model_type": "video", "license": "proprietary", "open_weight": false, @@ -15,11 +15,19 @@ "_generated": { "name": "7f1d98ab", "family": "adc96752", - "status": "379ac110", + "status": "2e2f74dc", "model_type": "4d1b75ca", "license": "9186c466", "open_weight": "68934a3e", - "modalities": "94e5e9ab" + "modalities": "94e5e9ab", + "deprecation_date": "ebf8cb32", + "successor": 
"b7b2c62c" }, - "last_updated": "2026-06-18" + "last_updated": "2026-06-30", + "deprecation_date": "2026-06-30", + "successor": [ + "veo-3.1-fast-generate-preview", + "the GA models on the Gemini Enterprise Agent Platf", + "m" + ] } diff --git a/packages/data/providers/vertex/models/veo-3.0-generate-001.json b/packages/data/providers/vertex/models/veo-3.0-generate-001.json index f018a6166..c41cedc60 100644 --- a/packages/data/providers/vertex/models/veo-3.0-generate-001.json +++ b/packages/data/providers/vertex/models/veo-3.0-generate-001.json @@ -4,7 +4,7 @@ "created_by": "google", "source": "official", "family": "veo-3.0", - "status": "active", + "status": "deprecated", "model_type": "video", "license": "proprietary", "open_weight": false, @@ -15,11 +15,19 @@ "_generated": { "name": "96869595", "family": "adc96752", - "status": "379ac110", + "status": "2e2f74dc", "model_type": "4d1b75ca", "license": "9186c466", "open_weight": "68934a3e", - "modalities": "94e5e9ab" + "modalities": "94e5e9ab", + "deprecation_date": "ebf8cb32", + "successor": "712c232f" }, - "last_updated": "2026-06-18" + "last_updated": "2026-06-30", + "deprecation_date": "2026-06-30", + "successor": [ + "veo-3.1-generate-preview", + "the GA models on the Gemini Enterprise Agent Platf", + "m" + ] } diff --git a/packages/data/src/data.ts b/packages/data/src/data.ts index f0f6dd694..004910287 100644 --- a/packages/data/src/data.ts +++ b/packages/data/src/data.ts @@ -15891,7 +15891,11 @@ export const providers: ProviderWithModels[] = [ ], "model_card_url": "https://huggingface.co/google/gemma-4-31B-it", "tokens_per_second": 1850, - "last_updated": "2026-06-29" + "last_updated": "2026-06-30", + "pricing": { + "input": 0.99, + "output": 1.49 + } }, { "id": "gpt-oss-120b", @@ -60551,7 +60555,9 @@ export const providers: ProviderWithModels[] = [ "chat_completions" ], "quantization": "fp8", - "last_updated": "2026-06-29" + "last_updated": "2026-06-30", + "description": "Ornith-1.0-35B is DeepReinforce's 
open (MIT-licensed) agentic-coding model: an RL post-train of Qwen3.5-35B-A3B, a 35B-total / ~3B-active Mixture-of-Experts with hybrid Gated-DeltaNet attention. It targets state-of-the-art open-model coding-agent performance (SWE-bench Verified 75.6, Terminal-Bench 2.1 64.2) with a 262K-token context, thinking/reasoning mode, tool calling, and image + video understanding.", + "tagline": "Ornith-1.0-35B is DeepReinforce's open (MIT-licensed) agentic-coding model: an RL post-train of Qwen3.5-35B-A3B, a 35B-total / ~3B-active Mixture-of-Experts with hybrid Gated-DeltaNet attention." }, { "id": "deepseek-ai/DeepSeek-R1-0528-Turbo", @@ -62590,8 +62596,8 @@ export const providers: ProviderWithModels[] = [ ] }, "pricing": { - "input": 0.45, - "output": 2.1 + "input": 0.4, + "output": 2 }, "tools": [ "function_calling" @@ -62600,7 +62606,7 @@ export const providers: ProviderWithModels[] = [ "chat_completions" ], "quantization": "fp8", - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" }, { "id": "MiniMaxAI/MiniMax-M2.7", @@ -68036,6 +68042,35 @@ export const providers: ProviderWithModels[] = [ "last_seen_at": "2026-05-20", "last_updated": "2026-06-03" }, + { + "id": "bria/extract-object", + "name": "Extract Object", + "created_by": "bria", + "source": "official", + "description": "Bria Extract Object uses text prompts to isolate a selected object from an image and return it as an RGBA PNG with a transparent background.", + "status": "active", + "release_date": "2026-06-28", + "model_type": "image", + "page_url": "https://fal.run/bria/extract-object", + "tagline": "Bria Extract Object uses text prompts to isolate a selected object from an image and return it as an RGBA PNG with a transparent background.", + "capabilities": { + "vision": true + }, + "modalities": { + "input": [ + "text", + "image" + ], + "output": [ + "image" + ] + }, + "endpoints": [ + "images" + ], + "last_seen_at": "2026-06-29", + "last_updated": "2026-06-30" + }, { "id": 
"bria/fibo-bbq-preview/generate", "name": "Fibo Bbq Preview", @@ -75066,8 +75101,8 @@ export const providers: ProviderWithModels[] = [ "endpoints": [ "images" ], - "last_seen_at": "2026-01-26", - "last_updated": "2026-05-11" + "last_seen_at": "2026-06-30", + "last_updated": "2026-06-30" }, { "id": "fal-ai/flux-2/klein/realtime", @@ -79472,8 +79507,8 @@ export const providers: ProviderWithModels[] = [ "capabilities": { "vision": true }, - "last_seen_at": "2026-06-24", - "last_updated": "2026-06-29" + "last_seen_at": "2026-06-29", + "last_updated": "2026-06-30" }, { "id": "fal-ai/hyper3d/rodin/v2.5/text-to-3d/fast", @@ -79489,8 +79524,8 @@ export const providers: ProviderWithModels[] = [ "capabilities": { "vision": true }, - "last_seen_at": "2026-06-24", - "last_updated": "2026-06-29" + "last_seen_at": "2026-06-29", + "last_updated": "2026-06-30" }, { "id": "fal-ai/hyper3d/rodin/v2.5/text-to-3d", @@ -97630,8 +97665,8 @@ export const providers: ProviderWithModels[] = [ "model_type": "other", "page_url": "https://fal.run/fal-ai/topaz/upscale/video", "tagline": "Professional-grade video upscaling using Topaz technology.", - "last_seen_at": "2026-05-26", - "last_updated": "2026-06-03" + "last_seen_at": "2026-06-29", + "last_updated": "2026-06-30" }, { "id": "fal-ai/transpixar", @@ -101263,8 +101298,8 @@ export const providers: ProviderWithModels[] = [ "endpoints": [ "images" ], - "last_seen_at": "2026-04-28", - "last_updated": "2026-06-03" + "last_seen_at": "2026-06-30", + "last_updated": "2026-06-30" }, { "id": "fal-ai/zonos", @@ -114890,8 +114925,8 @@ export const providers: ProviderWithModels[] = [ "name": "veo-2.0-generate-001", "created_by": "google", "source": "official", - "last_updated": "2026-06-29", - "status": "active", + "last_updated": "2026-06-30", + "status": "deprecated", "model_type": "video", "capabilities": { "streaming": true, @@ -114923,7 +114958,13 @@ export const providers: ProviderWithModels[] = [ "page_url": 
"https://ai.google.dev/gemini-api/docs/models/veo-2.0-generate-001", "open_weight": false, "description": "The Interactions API is now generally available. We recommend using this API for access to all the latest features and models. Home Gemini API Docs Send feedback Veo 2.0 This model is deprecated and will be shut down on **June 30, 2026**; migrate to Veo 3.1 Preview or the GA models available through the Gemini Enterprise Agent Platform to avoid service interruptions. Our robust and reliable stable video generation model, providing consistent performance for production-ready workflows. Veo 2.0 is best for standard 1080p content creation, social media assets, and high-volume video tasks that prioritize reliable character consistency and predictable sub-second generation speeds.", - "tagline": "Our robust and reliable stable video generation model, providing consistent performance for production-ready workflows." + "tagline": "Our robust and reliable stable video generation model, providing consistent performance for production-ready workflows.", + "deprecation_date": "2026-06-30", + "successor": [ + "veo-3.1-generate-preview", + "the GA models on the Gemini Enterprise Agent Platf", + "m" + ] }, { "id": "veo-3.0-fast-generate-001", @@ -114931,7 +114972,7 @@ export const providers: ProviderWithModels[] = [ "created_by": "google", "source": "official", "family": "veo-3.0", - "status": "active", + "status": "deprecated", "license": "proprietary", "model_type": "video", "modalities": { @@ -114943,7 +114984,13 @@ export const providers: ProviderWithModels[] = [ ] }, "open_weight": false, - "last_updated": "2026-06-18" + "last_updated": "2026-06-30", + "deprecation_date": "2026-06-30", + "successor": [ + "veo-3.1-fast-generate-preview", + "the GA models on the Gemini Enterprise Agent Platf", + "m" + ] }, { "id": "veo-3.0-fast-generate-preview", @@ -114973,7 +115020,7 @@ export const providers: ProviderWithModels[] = [ "created_by": "google", "source": "official", 
"family": "veo-3.0", - "status": "active", + "status": "deprecated", "license": "proprietary", "model_type": "video", "modalities": { @@ -114985,7 +115032,13 @@ export const providers: ProviderWithModels[] = [ ] }, "open_weight": false, - "last_updated": "2026-06-18" + "last_updated": "2026-06-30", + "deprecation_date": "2026-06-30", + "successor": [ + "veo-3.1-generate-preview", + "the GA models on the Gemini Enterprise Agent Platf", + "m" + ] }, { "id": "veo-3.0-generate-preview", @@ -116065,6 +116118,27 @@ export const providers: ProviderWithModels[] = [ ] } }, + { + "id": "deepreinforce-ai/Ornith-1.0-35B", + "name": "Ornith-1.0-35B", + "created_by": "deepreinforce-ai", + "source": "official", + "release_date": "2026-06-21", + "license": "mit", + "parameters": 0, + "page_url": "https://huggingface.co/deepreinforce-ai/Ornith-1.0-35B", + "architecture": "moe", + "capabilities": { + "streaming": true, + "tool_call": true, + "fine_tuning": true + }, + "open_weight": true, + "tools": [ + "function_calling" + ], + "last_updated": "2026-06-30" + }, { "id": "deepseek-ai/DeepSeek-R1-0528-Qwen3-8B", "name": "DeepSeek-R1-0528-Qwen3-8B", @@ -167690,7 +167764,9 @@ export const providers: ProviderWithModels[] = [ "tools": [ "function_calling" ], - "last_updated": "2026-06-18" + "last_updated": "2026-06-30", + "status": "deprecated", + "deprecation_date": "9999-01-01" }, { "id": "poolside/laguna-xs.2", @@ -170699,10 +170775,10 @@ export const providers: ProviderWithModels[] = [ "name": "StepFun: Step 3.5 Flash", "created_by": "stepfun", "source": "official", - "last_updated": "2026-06-29", + "last_updated": "2026-06-30", "description": "Step 3.5 Flash is StepFun's most capable open-source foundation model.", "context_window": 262144, - "max_output_tokens": 16384, + "max_output_tokens": 65536, "modalities": { "input": [ "text" @@ -170720,7 +170796,7 @@ export const providers: ProviderWithModels[] = [ "fine_tuning": true }, "pricing": { - "input": 0.09, + "input": 0.1, "output": 
0.3, "cached_input": 0.02 }, @@ -172271,14 +172347,14 @@ export const providers: ProviderWithModels[] = [ ] }, "pricing": { - "input": 0.98, - "output": 3.08, + "input": 0.975, + "output": 4.3, "cached_input": 0.182 }, "tools": [ "function_calling" ], - "last_updated": "2026-06-02", + "last_updated": "2026-06-30", "max_output_tokens": 131072 }, { @@ -172308,14 +172384,14 @@ export const providers: ProviderWithModels[] = [ ] }, "pricing": { - "input": 0.95, + "input": 0.94, "output": 3, "cached_input": 0.18 }, "tools": [ "function_calling" ], - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" }, { "id": "z-ai/glm-5", @@ -183797,9 +183873,9 @@ export const providers: ProviderWithModels[] = [ "endpoints": [ "chat_completions" ], - "huggingface_downloads": 7, + "huggingface_downloads": 10, "last_modified": "2024-12-06", - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" }, { "id": "arcade100k", @@ -183844,9 +183920,9 @@ export const providers: ProviderWithModels[] = [ "endpoints": [ "chat_completions" ], - "huggingface_downloads": 38, + "huggingface_downloads": 36, "last_modified": "2023-11-08", - "last_updated": "2026-06-20" + "last_updated": "2026-06-30" }, { "id": "control-lora", @@ -183942,9 +184018,9 @@ export const providers: ProviderWithModels[] = [ "endpoints": [ "chat_completions" ], - "huggingface_downloads": 59, + "huggingface_downloads": 49, "last_modified": "2023-11-17", - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" }, { "id": "japanese-stable-clip-vit-l-16", @@ -183976,9 +184052,9 @@ export const providers: ProviderWithModels[] = [ "endpoints": [ "chat_completions" ], - "huggingface_downloads": 1660, + "huggingface_downloads": 1579, "last_modified": "2024-07-10", - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" }, { "id": "japanese-stable-diffusion-xl", @@ -184042,9 +184118,9 @@ export const providers: ProviderWithModels[] = [ "endpoints": [ "chat_completions" ], - "huggingface_downloads": 13, + 
"huggingface_downloads": 14, "last_modified": "2024-07-10", - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" }, { "id": "japanese-stablelm-2-base-1_6b", @@ -184141,9 +184217,9 @@ export const providers: ProviderWithModels[] = [ "endpoints": [ "chat_completions" ], - "huggingface_downloads": 48, + "huggingface_downloads": 45, "last_modified": "2024-04-26", - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" }, { "id": "japanese-stablelm-3b-4e1t-instruct", @@ -184174,9 +184250,9 @@ export const providers: ProviderWithModels[] = [ "endpoints": [ "chat_completions" ], - "huggingface_downloads": 148, + "huggingface_downloads": 147, "last_modified": "2024-04-26", - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" }, { "id": "japanese-stablelm-base-alpha-7b", @@ -184207,9 +184283,9 @@ export const providers: ProviderWithModels[] = [ "endpoints": [ "chat_completions" ], - "huggingface_downloads": 330, + "huggingface_downloads": 310, "last_modified": "2023-08-22", - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" }, { "id": "japanese-stablelm-base-beta-70b", @@ -184240,9 +184316,9 @@ export const providers: ProviderWithModels[] = [ "endpoints": [ "chat_completions" ], - "huggingface_downloads": 127, + "huggingface_downloads": 126, "last_modified": "2023-12-19", - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" }, { "id": "japanese-stablelm-base-beta-7b", @@ -184273,9 +184349,9 @@ export const providers: ProviderWithModels[] = [ "endpoints": [ "chat_completions" ], - "huggingface_downloads": 50, + "huggingface_downloads": 48, "last_modified": "2023-12-19", - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" }, { "id": "japanese-stablelm-base-gamma-7b", @@ -184339,9 +184415,9 @@ export const providers: ProviderWithModels[] = [ "endpoints": [ "chat_completions" ], - "huggingface_downloads": 40, + "huggingface_downloads": 39, "last_modified": "2023-12-19", - "last_updated": "2026-06-29" + "last_updated": 
"2026-06-30" }, { "id": "japanese-stablelm-instruct-alpha-7b-v2", @@ -184372,9 +184448,9 @@ export const providers: ProviderWithModels[] = [ "endpoints": [ "chat_completions" ], - "huggingface_downloads": 40, + "huggingface_downloads": 38, "last_modified": "2023-10-06", - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" }, { "id": "japanese-stablelm-instruct-alpha-7b", @@ -184537,9 +184613,9 @@ export const providers: ProviderWithModels[] = [ "endpoints": [ "chat_completions" ], - "huggingface_downloads": 45, + "huggingface_downloads": 44, "last_modified": "2023-12-19", - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" }, { "id": "SAME-L", @@ -184569,9 +184645,9 @@ export const providers: ProviderWithModels[] = [ "endpoints": [ "chat_completions" ], - "huggingface_downloads": 6323, + "huggingface_downloads": 6334, "last_modified": "2026-06-24", - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" }, { "id": "SAME-S", @@ -184601,9 +184677,9 @@ export const providers: ProviderWithModels[] = [ "endpoints": [ "chat_completions" ], - "huggingface_downloads": 1549, + "huggingface_downloads": 1587, "last_modified": "2026-05-19", - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" }, { "id": "sd-turbo", @@ -184631,9 +184707,9 @@ export const providers: ProviderWithModels[] = [ "endpoints": [ "images" ], - "huggingface_downloads": 698263, + "huggingface_downloads": 684119, "last_modified": "2024-07-10", - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" }, { "id": "sd-vae-ft-ema-original", @@ -184680,9 +184756,9 @@ export const providers: ProviderWithModels[] = [ "page_url": "https://huggingface.co/stabilityai/sd-vae-ft-ema", "open_weight": true, "tagline": "Sd Vae Ft Ema is a Stability AI model published on the official Stability AI Hugging Face organization.", - "huggingface_downloads": 7037, + "huggingface_downloads": 6837, "last_modified": "2023-06-05", - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" }, 
{ "id": "sd-vae-ft-mse-original", @@ -184729,9 +184805,9 @@ export const providers: ProviderWithModels[] = [ "page_url": "https://huggingface.co/stabilityai/sd-vae-ft-mse", "open_weight": true, "tagline": "Sd Vae Ft Mse is a Stability AI model published on the official Stability AI Hugging Face organization.", - "huggingface_downloads": 102468, + "huggingface_downloads": 102400, "last_modified": "2023-06-06", - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" }, { "id": "sd-x2-latent-upscaler", @@ -184746,9 +184822,9 @@ export const providers: ProviderWithModels[] = [ "page_url": "https://huggingface.co/stabilityai/sd-x2-latent-upscaler", "open_weight": true, "tagline": "Sd X2 Latent Upscaler is a Stability AI model published on the official Stability AI Hugging Face organization.", - "huggingface_downloads": 130271, + "huggingface_downloads": 129146, "last_modified": "2023-06-05", - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" }, { "id": "sdxl-turbo-ryzen-ai", @@ -184810,9 +184886,9 @@ export const providers: ProviderWithModels[] = [ "endpoints": [ "images" ], - "huggingface_downloads": 29, + "huggingface_downloads": 30, "last_modified": "2025-10-20", - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" }, { "id": "sdxl-turbo", @@ -184842,9 +184918,9 @@ export const providers: ProviderWithModels[] = [ "endpoints": [ "images" ], - "huggingface_downloads": 609582, + "huggingface_downloads": 597950, "last_modified": "2024-07-10", - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" }, { "id": "sdxl-vae", @@ -184859,9 +184935,9 @@ export const providers: ProviderWithModels[] = [ "page_url": "https://huggingface.co/stabilityai/sdxl-vae", "open_weight": true, "tagline": "Sdxl Vae is a Stability AI model published on the official Stability AI Hugging Face organization.", - "huggingface_downloads": 263433, + "huggingface_downloads": 259409, "last_modified": "2023-08-04", - "last_updated": "2026-06-29" + "last_updated": 
"2026-06-30" }, { "id": "sp4d", @@ -184876,9 +184952,9 @@ export const providers: ProviderWithModels[] = [ "page_url": "https://huggingface.co/stabilityai/sp4d", "open_weight": true, "tagline": "Sp4d is a Stability AI model published on the official Stability AI Hugging Face organization.", - "huggingface_downloads": 15, + "huggingface_downloads": 12, "last_modified": "2025-11-05", - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" }, { "id": "stable-audio-3-medium-base", @@ -184893,9 +184969,9 @@ export const providers: ProviderWithModels[] = [ "page_url": "https://huggingface.co/stabilityai/stable-audio-3-medium-base", "open_weight": true, "tagline": "Stable Audio 3 Medium Base is a Stability AI model published on the official Stability AI Hugging Face organization.", - "huggingface_downloads": 4312, + "huggingface_downloads": 4447, "last_modified": "2026-06-16", - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" }, { "id": "stable-audio-3-medium", @@ -184910,9 +184986,9 @@ export const providers: ProviderWithModels[] = [ "page_url": "https://huggingface.co/stabilityai/stable-audio-3-medium", "open_weight": true, "tagline": "Stable Audio 3 Medium is a Stability AI model published on the official Stability AI Hugging Face organization.", - "huggingface_downloads": 59946, + "huggingface_downloads": 57092, "last_modified": "2026-06-16", - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" }, { "id": "stable-audio-3-small-music-base", @@ -184927,9 +185003,9 @@ export const providers: ProviderWithModels[] = [ "page_url": "https://huggingface.co/stabilityai/stable-audio-3-small-music-base", "open_weight": true, "tagline": "Stable Audio 3 Small Music Base is a Stability AI model published on the official Stability AI Hugging Face organization.", - "huggingface_downloads": 1769, + "huggingface_downloads": 1747, "last_modified": "2026-05-20", - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" }, { "id": 
"stable-audio-3-small-music", @@ -184944,9 +185020,9 @@ export const providers: ProviderWithModels[] = [ "page_url": "https://huggingface.co/stabilityai/stable-audio-3-small-music", "open_weight": true, "tagline": "Stable Audio 3 Small Music is a Stability AI model published on the official Stability AI Hugging Face organization.", - "huggingface_downloads": 15603, + "huggingface_downloads": 15375, "last_modified": "2026-05-19", - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" }, { "id": "stable-audio-3-small-sfx-base", @@ -184961,9 +185037,9 @@ export const providers: ProviderWithModels[] = [ "page_url": "https://huggingface.co/stabilityai/stable-audio-3-small-sfx-base", "open_weight": true, "tagline": "Stable Audio 3 Small Sfx Base is a Stability AI model published on the official Stability AI Hugging Face organization.", - "huggingface_downloads": 1054, + "huggingface_downloads": 1064, "last_modified": "2026-05-20", - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" }, { "id": "stable-audio-3-small-sfx", @@ -184978,9 +185054,9 @@ export const providers: ProviderWithModels[] = [ "page_url": "https://huggingface.co/stabilityai/stable-audio-3-small-sfx", "open_weight": true, "tagline": "Stable Audio 3 Small Sfx is a Stability AI model published on the official Stability AI Hugging Face organization.", - "huggingface_downloads": 12006, + "huggingface_downloads": 12045, "last_modified": "2026-05-19", - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" }, { "id": "stable-audio-open-1.0", @@ -185002,9 +185078,9 @@ export const providers: ProviderWithModels[] = [ "tools": [ "function_calling" ], - "huggingface_downloads": 26532, + "huggingface_downloads": 25989, "last_modified": "2025-06-19", - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" }, { "id": "stable-audio-open-small", @@ -185026,9 +185102,9 @@ export const providers: ProviderWithModels[] = [ "tools": [ "function_calling" ], - "huggingface_downloads": 2235, + 
"huggingface_downloads": 2169, "last_modified": "2025-05-27", - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" }, { "id": "stable-cascade-prior", @@ -185058,9 +185134,9 @@ export const providers: ProviderWithModels[] = [ "endpoints": [ "images" ], - "huggingface_downloads": 789, + "huggingface_downloads": 796, "last_modified": "2024-03-14", - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" }, { "id": "stable-cascade", @@ -185090,9 +185166,9 @@ export const providers: ProviderWithModels[] = [ "endpoints": [ "images" ], - "huggingface_downloads": 8252, + "huggingface_downloads": 8407, "last_modified": "2024-03-16", - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" }, { "id": "stable-code-3b", @@ -185123,9 +185199,9 @@ export const providers: ProviderWithModels[] = [ "endpoints": [ "chat_completions" ], - "huggingface_downloads": 5918, + "huggingface_downloads": 5825, "last_modified": "2024-07-10", - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" }, { "id": "stable-code-instruct-3b", @@ -185156,9 +185232,9 @@ export const providers: ProviderWithModels[] = [ "endpoints": [ "chat_completions" ], - "huggingface_downloads": 2335, + "huggingface_downloads": 2318, "last_modified": "2024-07-10", - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" }, { "id": "stable-codec-speech-16k-base", @@ -185236,9 +185312,9 @@ export const providers: ProviderWithModels[] = [ "endpoints": [ "images" ], - "huggingface_downloads": 27, + "huggingface_downloads": 31, "last_modified": "2026-05-05", - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" }, { "id": "stable-diffusion-3-medium-diffusers", @@ -185268,9 +185344,9 @@ export const providers: ProviderWithModels[] = [ "endpoints": [ "images" ], - "huggingface_downloads": 33289, + "huggingface_downloads": 32528, "last_modified": "2024-06-19", - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" }, { "id": "stable-diffusion-3-medium-tensorrt", @@ -185332,9 
+185408,9 @@ export const providers: ProviderWithModels[] = [ "endpoints": [ "images" ], - "huggingface_downloads": 3481, + "huggingface_downloads": 3491, "last_modified": "2024-08-12", - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" }, { "id": "stable-diffusion-3-medium_amdgpu", @@ -185556,9 +185632,9 @@ export const providers: ProviderWithModels[] = [ "endpoints": [ "images" ], - "huggingface_downloads": 1469, + "huggingface_downloads": 1483, "last_modified": "2025-10-20", - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" }, { "id": "stable-diffusion-3.5-large-turbo", @@ -185652,9 +185728,9 @@ export const providers: ProviderWithModels[] = [ "endpoints": [ "images" ], - "huggingface_downloads": 9, + "huggingface_downloads": 12, "last_modified": "2025-10-20", - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" }, { "id": "stable-diffusion-3.5-medium", @@ -185701,9 +185777,9 @@ export const providers: ProviderWithModels[] = [ "page_url": "https://huggingface.co/stabilityai/stable-diffusion-x4-upscaler", "open_weight": true, "tagline": "Stable Diffusion X4 Upscaler is a Stability AI model published on the official Stability AI Hugging Face organization.", - "huggingface_downloads": 10328, + "huggingface_downloads": 10040, "last_modified": "2023-07-05", - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" }, { "id": "stable-diffusion-xl-1.0-tensorrt", @@ -185733,9 +185809,9 @@ export const providers: ProviderWithModels[] = [ "endpoints": [ "images" ], - "huggingface_downloads": 275, + "huggingface_downloads": 276, "last_modified": "2025-10-20", - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" }, { "id": "stable-diffusion-xl-base-0.9", @@ -185765,9 +185841,9 @@ export const providers: ProviderWithModels[] = [ "endpoints": [ "images" ], - "huggingface_downloads": 48, + "huggingface_downloads": 51, "last_modified": "2023-07-12", - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" }, { "id": 
"stable-diffusion-xl-base-1.0", @@ -185797,9 +185873,9 @@ export const providers: ProviderWithModels[] = [ "endpoints": [ "images" ], - "huggingface_downloads": 1324082, + "huggingface_downloads": 1323188, "last_modified": "2023-10-30", - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" }, { "id": "stable-diffusion-xl-refiner-0.9", @@ -185830,9 +185906,9 @@ export const providers: ProviderWithModels[] = [ "endpoints": [ "images" ], - "huggingface_downloads": 45, + "huggingface_downloads": 48, "last_modified": "2023-07-12", - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" }, { "id": "stable-diffusion-xl-refiner-1.0", @@ -185863,9 +185939,9 @@ export const providers: ProviderWithModels[] = [ "endpoints": [ "images" ], - "huggingface_downloads": 163793, + "huggingface_downloads": 161798, "last_modified": "2023-09-25", - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" }, { "id": "stable-fast-3d", @@ -185884,9 +185960,9 @@ export const providers: ProviderWithModels[] = [ "vision": true, "fine_tuning": true }, - "huggingface_downloads": 11960, + "huggingface_downloads": 11721, "last_modified": "2025-04-08", - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" }, { "id": "stable-point-aware-3d", @@ -185971,9 +186047,9 @@ export const providers: ProviderWithModels[] = [ "endpoints": [ "video" ], - "huggingface_downloads": 7772, + "huggingface_downloads": 7755, "last_modified": "2024-07-10", - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" }, { "id": "stable-video-diffusion-img2vid-xt", @@ -186004,9 +186080,9 @@ export const providers: ProviderWithModels[] = [ "endpoints": [ "video" ], - "huggingface_downloads": 218304, + "huggingface_downloads": 216367, "last_modified": "2024-07-10", - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" }, { "id": "stable-video-diffusion-img2vid", @@ -186037,9 +186113,9 @@ export const providers: ProviderWithModels[] = [ "endpoints": [ "video" ], - "huggingface_downloads": 
32007, + "huggingface_downloads": 31140, "last_modified": "2024-07-10", - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" }, { "id": "stable-virtual-camera", @@ -186118,9 +186194,9 @@ export const providers: ProviderWithModels[] = [ "endpoints": [ "chat_completions" ], - "huggingface_downloads": 260, + "huggingface_downloads": 257, "last_modified": "2023-08-29", - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" }, { "id": "StableBeluga-7B", @@ -186149,9 +186225,9 @@ export const providers: ProviderWithModels[] = [ "endpoints": [ "chat_completions" ], - "huggingface_downloads": 251, + "huggingface_downloads": 248, "last_modified": "2023-08-29", - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" }, { "id": "StableBeluga1-Delta", @@ -186211,9 +186287,9 @@ export const providers: ProviderWithModels[] = [ "endpoints": [ "chat_completions" ], - "huggingface_downloads": 717, + "huggingface_downloads": 761, "last_modified": "2023-09-18", - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" }, { "id": "stablecode-completion-alpha-3b-4k", @@ -186244,9 +186320,9 @@ export const providers: ProviderWithModels[] = [ "endpoints": [ "chat_completions" ], - "huggingface_downloads": 1115, + "huggingface_downloads": 1092, "last_modified": "2023-08-08", - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" }, { "id": "stablecode-completion-alpha-3b", @@ -186277,9 +186353,9 @@ export const providers: ProviderWithModels[] = [ "endpoints": [ "chat_completions" ], - "huggingface_downloads": 408, + "huggingface_downloads": 385, "last_modified": "2023-08-08", - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" }, { "id": "stablecode-instruct-alpha-3b", @@ -186347,9 +186423,9 @@ export const providers: ProviderWithModels[] = [ "tools": [ "function_calling" ], - "huggingface_downloads": 168, + "huggingface_downloads": 176, "last_modified": "2024-04-20", - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" }, { "id": 
"stablelm-2-12b-chat", @@ -186384,9 +186460,9 @@ export const providers: ProviderWithModels[] = [ "tools": [ "function_calling" ], - "huggingface_downloads": 266, + "huggingface_downloads": 260, "last_modified": "2024-05-20", - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" }, { "id": "stablelm-2-12b", @@ -186417,9 +186493,9 @@ export const providers: ProviderWithModels[] = [ "endpoints": [ "chat_completions" ], - "huggingface_downloads": 3144, + "huggingface_downloads": 3321, "last_modified": "2024-07-10", - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" }, { "id": "stablelm-2-1_6b-chat", @@ -186450,9 +186526,9 @@ export const providers: ProviderWithModels[] = [ "endpoints": [ "chat_completions" ], - "huggingface_downloads": 843, + "huggingface_downloads": 867, "last_modified": "2024-06-03", - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" }, { "id": "stablelm-2-1_6b", @@ -186483,9 +186559,9 @@ export const providers: ProviderWithModels[] = [ "endpoints": [ "chat_completions" ], - "huggingface_downloads": 10285, + "huggingface_downloads": 10913, "last_modified": "2024-07-10", - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" }, { "id": "stablelm-2-zephyr-1_6b", @@ -186516,9 +186592,9 @@ export const providers: ProviderWithModels[] = [ "endpoints": [ "chat_completions" ], - "huggingface_downloads": 3318, + "huggingface_downloads": 3299, "last_modified": "2024-06-03", - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" }, { "id": "stablelm-3b-4e1t", @@ -186549,9 +186625,9 @@ export const providers: ProviderWithModels[] = [ "endpoints": [ "chat_completions" ], - "huggingface_downloads": 93520, + "huggingface_downloads": 93032, "last_modified": "2024-03-07", - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" }, { "id": "stablelm-base-alpha-3b-v2", @@ -186582,9 +186658,9 @@ export const providers: ProviderWithModels[] = [ "endpoints": [ "chat_completions" ], - "huggingface_downloads": 531, + 
"huggingface_downloads": 528, "last_modified": "2023-09-11", - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" }, { "id": "stablelm-base-alpha-3b", @@ -186615,9 +186691,9 @@ export const providers: ProviderWithModels[] = [ "endpoints": [ "chat_completions" ], - "huggingface_downloads": 3011, + "huggingface_downloads": 2984, "last_modified": "2023-10-19", - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" }, { "id": "stablelm-base-alpha-7b-v2", @@ -186681,9 +186757,9 @@ export const providers: ProviderWithModels[] = [ "endpoints": [ "chat_completions" ], - "huggingface_downloads": 999, + "huggingface_downloads": 974, "last_modified": "2023-10-19", - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" }, { "id": "stablelm-tuned-alpha-3b", @@ -186714,9 +186790,9 @@ export const providers: ProviderWithModels[] = [ "endpoints": [ "chat_completions" ], - "huggingface_downloads": 845, + "huggingface_downloads": 819, "last_modified": "2023-04-19", - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" }, { "id": "stablelm-tuned-alpha-7b", @@ -186747,9 +186823,9 @@ export const providers: ProviderWithModels[] = [ "endpoints": [ "chat_completions" ], - "huggingface_downloads": 5838, + "huggingface_downloads": 5821, "last_modified": "2023-04-19", - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" }, { "id": "stablelm-zephyr-3b", @@ -186780,9 +186856,9 @@ export const providers: ProviderWithModels[] = [ "endpoints": [ "chat_completions" ], - "huggingface_downloads": 28453, + "huggingface_downloads": 28462, "last_modified": "2024-07-10", - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" }, { "id": "sv3d", @@ -186877,9 +186953,9 @@ export const providers: ProviderWithModels[] = [ "endpoints": [ "chat_completions" ], - "huggingface_downloads": 1405, + "huggingface_downloads": 1395, "last_modified": "2024-03-31", - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" }, { "id": "TripoSR", @@ -186898,9 +186974,9 @@ 
export const providers: ProviderWithModels[] = [ "vision": true, "fine_tuning": true }, - "huggingface_downloads": 189582, + "huggingface_downloads": 188532, "last_modified": "2024-08-09", - "last_updated": "2026-06-29" + "last_updated": "2026-06-30" } ] }, @@ -202628,8 +202704,8 @@ export const providers: ProviderWithModels[] = [ "name": "veo-2.0-generate-001", "created_by": "google", "source": "official", - "last_updated": "2026-06-29", - "status": "active", + "last_updated": "2026-06-30", + "status": "deprecated", "model_type": "video", "capabilities": { "streaming": true, @@ -202660,7 +202736,13 @@ export const providers: ProviderWithModels[] = [ "license": "proprietary", "open_weight": false, "description": "The Interactions API is now generally available. We recommend using this API for access to all the latest features and models. Home Gemini API Docs Send feedback Veo 2.0 This model is deprecated and will be shut down on **June 30, 2026**; migrate to Veo 3.1 Preview or the GA models available through the Gemini Enterprise Agent Platform to avoid service interruptions. Our robust and reliable stable video generation model, providing consistent performance for production-ready workflows. Veo 2.0 is best for standard 1080p content creation, social media assets, and high-volume video tasks that prioritize reliable character consistency and predictable sub-second generation speeds.", - "tagline": "Our robust and reliable stable video generation model, providing consistent performance for production-ready workflows." 
+ "tagline": "Our robust and reliable stable video generation model, providing consistent performance for production-ready workflows.", + "deprecation_date": "2026-06-30", + "successor": [ + "veo-3.1-generate-preview", + "the GA models on the Gemini Enterprise Agent Platf", + "m" + ] }, { "id": "veo-3.0-fast-generate-001", @@ -202668,7 +202750,7 @@ export const providers: ProviderWithModels[] = [ "created_by": "google", "source": "official", "family": "veo-3.0", - "status": "active", + "status": "deprecated", "model_type": "video", "license": "proprietary", "open_weight": false, @@ -202680,7 +202762,13 @@ export const providers: ProviderWithModels[] = [ "video" ] }, - "last_updated": "2026-06-18" + "last_updated": "2026-06-30", + "deprecation_date": "2026-06-30", + "successor": [ + "veo-3.1-fast-generate-preview", + "the GA models on the Gemini Enterprise Agent Platf", + "m" + ] }, { "id": "veo-3.0-fast-generate-preview", @@ -202710,7 +202798,7 @@ export const providers: ProviderWithModels[] = [ "created_by": "google", "source": "official", "family": "veo-3.0", - "status": "active", + "status": "deprecated", "model_type": "video", "license": "proprietary", "open_weight": false, @@ -202722,7 +202810,13 @@ export const providers: ProviderWithModels[] = [ "video" ] }, - "last_updated": "2026-06-18" + "last_updated": "2026-06-30", + "deprecation_date": "2026-06-30", + "successor": [ + "veo-3.1-generate-preview", + "the GA models on the Gemini Enterprise Agent Platf", + "m" + ] }, { "id": "veo-3.0-generate-preview", diff --git a/packages/npm/src/providers/cerebras.ts b/packages/npm/src/providers/cerebras.ts index b424263c0..e197b7c8f 100644 --- a/packages/npm/src/providers/cerebras.ts +++ b/packages/npm/src/providers/cerebras.ts @@ -3,6 +3,6 @@ import type { ProviderWithModels, Model } from '../types'; -export const provider: ProviderWithModels = {"id":"cerebras","name":"Cerebras","region":"US","headquarters":"Sunnyvale, 
CA","founded":2016,"url":"https://cerebras.ai","api_url":"https://api.cerebras.ai/v1","docs_url":"https://inference-docs.cerebras.ai","pricing_url":"https://cerebras.ai/pricing","description":"Ultra-fast inference powered by wafer-scale compute chips, offering the fastest LLM speeds.","type":"cloud","playground_url":"https://inference.cerebras.ai","openai_compatible":true,"free_tier":true,"models_url":"https://inference-docs.cerebras.ai/introduction","twitter_url":"https://x.com/CerebrasSystems","discord_url":"https://discord.com/invite/q6bZcMWJVu","blog_url":"https://www.cerebras.ai/blog","terms_url":"https://cloud.cerebras.ai/terms","support_url":"https://support.cerebras.net","icon":"\n \n \n","models":[{"id":"deepseek-r1-distill-llama-70b","name":"deepseek-r1-distill-llama-70b","created_by":"meta","source":"official","last_updated":"2026-03-23","family":"deepseek-r1","status":"deprecated","deprecation_date":"2025-08-12","model_type":"chat","successor":"Qwen 3 32B","modalities":{"input":["text"],"output":["text"]},"parameters":70,"open_weight":true},{"id":"gemma-4-31b","name":"Gemma 4 31B","created_by":"unknown","source":"official","family":"gemma-4","status":"preview","context_window":131000,"max_output_tokens":40000,"model_type":"chat","reasoning_tokens":true,"parameters":31,"open_weight":true,"capabilities":{"reasoning":true,"streaming":true,"structured_output":true,"tool_call":true,"prompt_caching":true,"json_mode":true},"modalities":{"input":["text","image"],"output":["text"]},"endpoints":["chat_completions","completions"],"tools":["function_calling"],"model_card_url":"https://huggingface.co/google/gemma-4-31B-it","tokens_per_second":1850,"last_updated":"2026-06-29"},{"id":"gpt-oss-120b","name":"OpenAI GPT 
OSS","created_by":"openai","source":"official","last_updated":"2026-03-24","family":"gpt-oss","context_window":131000,"max_output_tokens":40000,"capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"prompt_caching":true,"json_mode":true,"fine_tuning":false,"vision":false,"batch":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.35,"output":0.75},"model_type":"chat","status":"active","endpoints":["chat_completions"],"model_card_url":"https://openai.com/index/gpt-oss-model-card/","tokens_per_second":3000,"parameters":120,"precision":"FP16/FP8 (weights only)","huggingface_url":"https://huggingface.co/openai/gpt-oss-120b","reasoning_tokens":true,"open_weight":true,"tools":["function_calling"],"description":"\\","tagline":"Most powerful open-weight model, fits into an H100 GPU","knowledge_cutoff":"2024-06","license":"apache-2.0"},{"id":"llama-3.3-70b","name":"llama-3.3-70b","created_by":"meta","source":"official","last_updated":"2026-06-03","family":"llama-3.3","status":"deprecated","deprecation_date":"2026-02-16","model_type":"chat","successor":"gpt-oss-120b","modalities":{"input":["text"],"output":["text"]},"parameters":70,"open_weight":true},{"id":"llama-4-maverick-17b-128e-instruct","name":"llama-4-maverick-17b-128e-instruct","created_by":"meta","source":"official","last_updated":"2026-06-03","family":"llama-4","status":"deprecated","deprecation_date":"2025-10-15","model_type":"chat","successor":"gpt-oss-120b","modalities":{"input":["text"],"output":["text"]},"parameters":17,"open_weight":true,"context_window":1048576,"max_output_tokens":16384,"license":"llama4","capabilities":{"streaming":true,"tool_call":true,"vision":true,"fine_tuning":true}},{"id":"llama-4-scout-17b-16e-instruct","name":"llama-4-scout-17b-16e-instruct","created_by":"meta","source":"official","last_updated":"2026-06-03","family":"llama-4","status":"deprecated","deprecation_date":"2025-11-03","model_type":"chat","successor":"gpt-oss-1
20b","modalities":{"input":["text"],"output":["text"]},"parameters":17,"open_weight":true,"context_window":1048576,"max_output_tokens":16384,"license":"llama4","capabilities":{"streaming":true,"tool_call":true,"vision":true,"fine_tuning":true}},{"id":"llama3.1-70b","name":"llama3.1-70b","created_by":"meta","source":"official","last_updated":"2026-06-03","status":"deprecated","deprecation_date":"2025-01-17","model_type":"chat","successor":"llama-3.3-70b","modalities":{"input":["text"],"output":["text"]},"parameters":70,"open_weight":true},{"id":"llama3.1-8b","name":"Llama 3.1 8B","created_by":"meta","source":"official","last_updated":"2026-06-03","context_window":32000,"max_output_tokens":8000,"capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"json_mode":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.1,"output":0.1},"status":"deprecated","model_type":"chat","endpoints":["chat_completions","completions"],"model_card_url":"https://huggingface.co/meta-llama/Llama-3.1-8B-Instruct","tokens_per_second":2200,"parameters":8,"precision":"FP","huggingface_url":"https://huggingface.co/meta-llama/Llama-3.1-8B-Instruct","open_weight":true,"tools":["function_calling"],"deprecation_date":"2026-05-27","successor":"gpt-oss-120b"},{"id":"qwen-3-235b-a22b-instruct-2507","name":"Qwen 3 235B 
Instruct","created_by":"qwen","source":"official","last_updated":"2026-06-03","family":"qwen","context_window":131000,"max_output_tokens":40000,"alias":"qwen-3-235b-a22b-instruct","capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"prompt_caching":true,"json_mode":true,"reasoning":true,"batch":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.6,"output":1.2},"model_type":"chat","status":"deprecated","endpoints":["chat_completions","completions"],"model_card_url":"https://huggingface.co/Qwen/Qwen3-235B-A22B-Instruct-2507","tokens_per_second":1400,"parameters":235,"precision":"FP16/FP8 (weights only)","huggingface_url":"https://huggingface.co/Qwen/Qwen3-235B-A22B-Instruct-2507","open_weight":true,"tools":["function_calling"],"deprecation_date":"2026-05-27","active_parameters":22,"successor":"gpt-oss-120b","license":"apache-2.0"},{"id":"qwen-3-235b-a22b-instruct","name":"Qwen 3 235B Instruct","created_by":"qwen","source":"official","last_updated":"2026-03-24","family":"qwen","context_window":131000,"max_output_tokens":40000,"capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"prompt_caching":true,"json_mode":true,"reasoning":true,"batch":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.6,"output":1.2},"snapshots":["qwen-3-235b-a22b-instruct-2507"],"model_type":"chat","status":"preview","endpoints":["chat_completions","completions"],"model_card_url":"https://huggingface.co/Qwen/Qwen3-235B-A22B-Instruct-2507","tokens_per_second":1400,"parameters":235,"precision":"FP16/FP8 (weights 
only)","huggingface_url":"https://huggingface.co/Qwen/Qwen3-235B-A22B-Instruct-2507","open_weight":true,"tools":["function_calling"],"license":"apache-2.0","active_parameters":22},{"id":"qwen-3-235b-a22b-thinking-2507","name":"qwen-3-235b-a22b-thinking-2507","created_by":"qwen","source":"official","last_updated":"2026-06-03","family":"qwen","status":"deprecated","deprecation_date":"2025-11-14","model_type":"chat","successor":"gpt-oss-120b","modalities":{"input":["text"],"output":["text"]},"parameters":235,"active_parameters":22,"open_weight":true,"context_window":256000,"license":"apache-2.0","capabilities":{"streaming":true,"tool_call":true,"reasoning":true,"structured_output":true,"batch":true,"fine_tuning":true,"json_mode":true}},{"id":"qwen-3-235b-a22b","name":"qwen-3-235b-a22b","created_by":"qwen","source":"official","last_updated":"2026-03-23","family":"qwen","status":"deprecated","deprecation_date":"2025-07-29","model_type":"chat","successor":"Qwen 3 235B Instruct","modalities":{"input":["text"],"output":["text"]},"parameters":235,"active_parameters":22,"open_weight":true,"context_window":256000,"license":"apache-2.0","capabilities":{"streaming":true,"tool_call":true,"reasoning":true,"structured_output":true,"batch":true,"fine_tuning":true,"json_mode":true}},{"id":"qwen-3-32b","name":"qwen-3-32b","created_by":"qwen","source":"official","last_updated":"2026-06-03","family":"qwen","status":"deprecated","deprecation_date":"2026-02-16","model_type":"chat","successor":"gpt-oss-120b","modalities":{"input":["text"],"output":["text"]},"parameters":32,"open_weight":true,"context_window":256000,"license":"apache-2.0","capabilities":{"streaming":true,"reasoning":true,"tool_call":true,"structured_output":true,"batch":true,"fine_tuning":true,"json_mode":true}},{"id":"qwen-3-coder-480b","name":"qwen-3-coder-480b","created_by":"qwen","source":"official","last_updated":"2026-06-03","family":"qwen","status":"deprecated","deprecation_date":"2025-11-05","model_type":"chat","suc
cessor":"zai-glm-4.7","modalities":{"input":["text"],"output":["text"]},"parameters":480,"open_weight":true},{"id":"zai-glm-4.6","name":"zai-glm-4.6","created_by":"zhipu","source":"official","last_updated":"2026-06-03","status":"deprecated","deprecation_date":"2026-01-20","model_type":"chat","successor":"zai-glm-4.7","modalities":{"input":["text"],"output":["text"]},"open_weight":true},{"id":"zai-glm-4.7","name":"Z.ai GLM 4.7","created_by":"zhipu","source":"official","last_updated":"2026-06-03","context_window":131000,"max_output_tokens":40000,"capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"prompt_caching":true,"json_mode":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":2.25,"output":2.75},"status":"preview","model_type":"chat","endpoints":["chat_completions"],"model_card_url":"https://huggingface.co/zai-org/GLM-4.7","tokens_per_second":1000,"parameters":355,"precision":"FP16/FP8 (weights only)","huggingface_url":"https://huggingface.co/zai-org/GLM-4.7","reasoning_tokens":true,"open_weight":true,"tools":["function_calling"]}]}; +export const provider: ProviderWithModels = {"id":"cerebras","name":"Cerebras","region":"US","headquarters":"Sunnyvale, CA","founded":2016,"url":"https://cerebras.ai","api_url":"https://api.cerebras.ai/v1","docs_url":"https://inference-docs.cerebras.ai","pricing_url":"https://cerebras.ai/pricing","description":"Ultra-fast inference powered by wafer-scale compute chips, offering the fastest LLM speeds.","type":"cloud","playground_url":"https://inference.cerebras.ai","openai_compatible":true,"free_tier":true,"models_url":"https://inference-docs.cerebras.ai/introduction","twitter_url":"https://x.com/CerebrasSystems","discord_url":"https://discord.com/invite/q6bZcMWJVu","blog_url":"https://www.cerebras.ai/blog","terms_url":"https://cloud.cerebras.ai/terms","support_url":"https://support.cerebras.net","icon":"\n \n 
\n","models":[{"id":"deepseek-r1-distill-llama-70b","name":"deepseek-r1-distill-llama-70b","created_by":"meta","source":"official","last_updated":"2026-03-23","family":"deepseek-r1","status":"deprecated","deprecation_date":"2025-08-12","model_type":"chat","successor":"Qwen 3 32B","modalities":{"input":["text"],"output":["text"]},"parameters":70,"open_weight":true},{"id":"gemma-4-31b","name":"Gemma 4 31B","created_by":"unknown","source":"official","family":"gemma-4","status":"preview","context_window":131000,"max_output_tokens":40000,"model_type":"chat","reasoning_tokens":true,"parameters":31,"open_weight":true,"capabilities":{"reasoning":true,"streaming":true,"structured_output":true,"tool_call":true,"prompt_caching":true,"json_mode":true},"modalities":{"input":["text","image"],"output":["text"]},"endpoints":["chat_completions","completions"],"tools":["function_calling"],"model_card_url":"https://huggingface.co/google/gemma-4-31B-it","tokens_per_second":1850,"last_updated":"2026-06-30","pricing":{"input":0.99,"output":1.49}},{"id":"gpt-oss-120b","name":"OpenAI GPT OSS","created_by":"openai","source":"official","last_updated":"2026-03-24","family":"gpt-oss","context_window":131000,"max_output_tokens":40000,"capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"prompt_caching":true,"json_mode":true,"fine_tuning":false,"vision":false,"batch":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.35,"output":0.75},"model_type":"chat","status":"active","endpoints":["chat_completions"],"model_card_url":"https://openai.com/index/gpt-oss-model-card/","tokens_per_second":3000,"parameters":120,"precision":"FP16/FP8 (weights only)","huggingface_url":"https://huggingface.co/openai/gpt-oss-120b","reasoning_tokens":true,"open_weight":true,"tools":["function_calling"],"description":"\\","tagline":"Most powerful open-weight model, fits into an H100 
GPU","knowledge_cutoff":"2024-06","license":"apache-2.0"},{"id":"llama-3.3-70b","name":"llama-3.3-70b","created_by":"meta","source":"official","last_updated":"2026-06-03","family":"llama-3.3","status":"deprecated","deprecation_date":"2026-02-16","model_type":"chat","successor":"gpt-oss-120b","modalities":{"input":["text"],"output":["text"]},"parameters":70,"open_weight":true},{"id":"llama-4-maverick-17b-128e-instruct","name":"llama-4-maverick-17b-128e-instruct","created_by":"meta","source":"official","last_updated":"2026-06-03","family":"llama-4","status":"deprecated","deprecation_date":"2025-10-15","model_type":"chat","successor":"gpt-oss-120b","modalities":{"input":["text"],"output":["text"]},"parameters":17,"open_weight":true,"context_window":1048576,"max_output_tokens":16384,"license":"llama4","capabilities":{"streaming":true,"tool_call":true,"vision":true,"fine_tuning":true}},{"id":"llama-4-scout-17b-16e-instruct","name":"llama-4-scout-17b-16e-instruct","created_by":"meta","source":"official","last_updated":"2026-06-03","family":"llama-4","status":"deprecated","deprecation_date":"2025-11-03","model_type":"chat","successor":"gpt-oss-120b","modalities":{"input":["text"],"output":["text"]},"parameters":17,"open_weight":true,"context_window":1048576,"max_output_tokens":16384,"license":"llama4","capabilities":{"streaming":true,"tool_call":true,"vision":true,"fine_tuning":true}},{"id":"llama3.1-70b","name":"llama3.1-70b","created_by":"meta","source":"official","last_updated":"2026-06-03","status":"deprecated","deprecation_date":"2025-01-17","model_type":"chat","successor":"llama-3.3-70b","modalities":{"input":["text"],"output":["text"]},"parameters":70,"open_weight":true},{"id":"llama3.1-8b","name":"Llama 3.1 
8B","created_by":"meta","source":"official","last_updated":"2026-06-03","context_window":32000,"max_output_tokens":8000,"capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"json_mode":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.1,"output":0.1},"status":"deprecated","model_type":"chat","endpoints":["chat_completions","completions"],"model_card_url":"https://huggingface.co/meta-llama/Llama-3.1-8B-Instruct","tokens_per_second":2200,"parameters":8,"precision":"FP","huggingface_url":"https://huggingface.co/meta-llama/Llama-3.1-8B-Instruct","open_weight":true,"tools":["function_calling"],"deprecation_date":"2026-05-27","successor":"gpt-oss-120b"},{"id":"qwen-3-235b-a22b-instruct-2507","name":"Qwen 3 235B Instruct","created_by":"qwen","source":"official","last_updated":"2026-06-03","family":"qwen","context_window":131000,"max_output_tokens":40000,"alias":"qwen-3-235b-a22b-instruct","capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"prompt_caching":true,"json_mode":true,"reasoning":true,"batch":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.6,"output":1.2},"model_type":"chat","status":"deprecated","endpoints":["chat_completions","completions"],"model_card_url":"https://huggingface.co/Qwen/Qwen3-235B-A22B-Instruct-2507","tokens_per_second":1400,"parameters":235,"precision":"FP16/FP8 (weights only)","huggingface_url":"https://huggingface.co/Qwen/Qwen3-235B-A22B-Instruct-2507","open_weight":true,"tools":["function_calling"],"deprecation_date":"2026-05-27","active_parameters":22,"successor":"gpt-oss-120b","license":"apache-2.0"},{"id":"qwen-3-235b-a22b-instruct","name":"Qwen 3 235B 
Instruct","created_by":"qwen","source":"official","last_updated":"2026-03-24","family":"qwen","context_window":131000,"max_output_tokens":40000,"capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"prompt_caching":true,"json_mode":true,"reasoning":true,"batch":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.6,"output":1.2},"snapshots":["qwen-3-235b-a22b-instruct-2507"],"model_type":"chat","status":"preview","endpoints":["chat_completions","completions"],"model_card_url":"https://huggingface.co/Qwen/Qwen3-235B-A22B-Instruct-2507","tokens_per_second":1400,"parameters":235,"precision":"FP16/FP8 (weights only)","huggingface_url":"https://huggingface.co/Qwen/Qwen3-235B-A22B-Instruct-2507","open_weight":true,"tools":["function_calling"],"license":"apache-2.0","active_parameters":22},{"id":"qwen-3-235b-a22b-thinking-2507","name":"qwen-3-235b-a22b-thinking-2507","created_by":"qwen","source":"official","last_updated":"2026-06-03","family":"qwen","status":"deprecated","deprecation_date":"2025-11-14","model_type":"chat","successor":"gpt-oss-120b","modalities":{"input":["text"],"output":["text"]},"parameters":235,"active_parameters":22,"open_weight":true,"context_window":256000,"license":"apache-2.0","capabilities":{"streaming":true,"tool_call":true,"reasoning":true,"structured_output":true,"batch":true,"fine_tuning":true,"json_mode":true}},{"id":"qwen-3-235b-a22b","name":"qwen-3-235b-a22b","created_by":"qwen","source":"official","last_updated":"2026-03-23","family":"qwen","status":"deprecated","deprecation_date":"2025-07-29","model_type":"chat","successor":"Qwen 3 235B 
Instruct","modalities":{"input":["text"],"output":["text"]},"parameters":235,"active_parameters":22,"open_weight":true,"context_window":256000,"license":"apache-2.0","capabilities":{"streaming":true,"tool_call":true,"reasoning":true,"structured_output":true,"batch":true,"fine_tuning":true,"json_mode":true}},{"id":"qwen-3-32b","name":"qwen-3-32b","created_by":"qwen","source":"official","last_updated":"2026-06-03","family":"qwen","status":"deprecated","deprecation_date":"2026-02-16","model_type":"chat","successor":"gpt-oss-120b","modalities":{"input":["text"],"output":["text"]},"parameters":32,"open_weight":true,"context_window":256000,"license":"apache-2.0","capabilities":{"streaming":true,"reasoning":true,"tool_call":true,"structured_output":true,"batch":true,"fine_tuning":true,"json_mode":true}},{"id":"qwen-3-coder-480b","name":"qwen-3-coder-480b","created_by":"qwen","source":"official","last_updated":"2026-06-03","family":"qwen","status":"deprecated","deprecation_date":"2025-11-05","model_type":"chat","successor":"zai-glm-4.7","modalities":{"input":["text"],"output":["text"]},"parameters":480,"open_weight":true},{"id":"zai-glm-4.6","name":"zai-glm-4.6","created_by":"zhipu","source":"official","last_updated":"2026-06-03","status":"deprecated","deprecation_date":"2026-01-20","model_type":"chat","successor":"zai-glm-4.7","modalities":{"input":["text"],"output":["text"]},"open_weight":true},{"id":"zai-glm-4.7","name":"Z.ai GLM 4.7","created_by":"zhipu","source":"official","last_updated":"2026-06-03","context_window":131000,"max_output_tokens":40000,"capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"prompt_caching":true,"json_mode":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":2.25,"output":2.75},"status":"preview","model_type":"chat","endpoints":["chat_completions"],"model_card_url":"https://huggingface.co/zai-org/GLM-4.7","tokens_per_second":1000,"parameters":355,"precision":"FP16/FP8 (weights 
only)","huggingface_url":"https://huggingface.co/zai-org/GLM-4.7","reasoning_tokens":true,"open_weight":true,"tools":["function_calling"]}]}; export const models: Model[] = provider.models.map((m) => ({ ...m, provider: provider.id })); diff --git a/packages/npm/src/providers/deepinfra.ts b/packages/npm/src/providers/deepinfra.ts index a2840bd4c..e9d6d3f9d 100644 --- a/packages/npm/src/providers/deepinfra.ts +++ b/packages/npm/src/providers/deepinfra.ts @@ -3,6 +3,6 @@ import type { ProviderWithModels, Model } from '../types'; -export const provider: ProviderWithModels = {"id":"deepinfra","name":"DeepInfra","region":"US","headquarters":"Palo Alto, CA","founded":2022,"url":"https://deepinfra.com","api_url":"https://api.deepinfra.com/v1/openai","docs_url":"https://deepinfra.com/docs","pricing_url":"https://deepinfra.com/pricing","description":"Serverless inference cloud for open-weight LLMs, image, video, TTS, transcription, embedding, and reranker models with an OpenAI-compatible API.","type":"cloud","playground_url":"https://deepinfra.com/chat","status_url":"https://status.deepinfra.com","openai_compatible":true,"free_tier":false,"github_url":"https://github.com/deepinfra","models_url":"https://deepinfra.com/models","twitter_url":"https://x.com/DeepInfra","discord_url":"https://discord.gg/deepinfra","blog_url":"https://deepinfra.com/blog","terms_url":"https://deepinfra.com/terms","support_url":"https://deepinfra.com/contact","icon":"\n \n \n","models":[{"id":"ACE-Step/acestep-v15-xl-sft","name":"acestep-v15-xl-sft","created_by":"ace-step","source":"official","description":"ACE-Step v1.5 is a powerful open-source music foundation model that turns a text prompt into a complete song — vocals, lyrics, and instrumentation — at quality that rivals commercial tools. 
We run the high-quality XL checkpoint with its planning step (\"thinking\") on by default, so generations favor musical structure and coherence over raw speed.","status":"active","model_type":"chat","open_weight":true,"tagline":"ACE-Step v1.5 is a powerful open-source music foundation model that turns a text prompt into a complete song — vocals, lyrics, and instrumentation — at quality that rivals commercial tools.","capabilities":{"streaming":true},"modalities":{"input":["text"],"output":["text"]},"pricing_notes":["$0.001 / second of audio"],"last_updated":"2026-06-18"},{"id":"allenai/Olmo-3.1-32B-Instruct","name":"Olmo-3.1-32B-Instruct","created_by":"allenai","source":"official","last_updated":"2026-04-26","family":"allenai","description":"Olmo is a series of Open language models, developed by Allen Institute for AI (Ai2), designed to enable the science of language models.","status":"active","model_type":"chat","context_window":65536,"open_weight":true,"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.2,"output":0.6},"tools":["function_calling"],"endpoints":["chat_completions"],"tagline":"Olmo is a series of Open language models, developed by Allen Institute for AI (Ai2), designed to enable the science of language models."},{"id":"allenai/olmOCR-2-7B-1025","name":"olmOCR-2-7B-1025","created_by":"allenai","source":"official","last_updated":"2026-04-26","family":"allenai","description":"olmOCR is a specialized AI tool that converts PDF documents into clean, structured text while preserving important formatting and layout information. What makes olmOCR particularly valuable for developers is its ability to handle challenging PDFs that traditional OCR tools struggle with—including complex layouts, poor-quality scans, handwritten text, and documents with mixed content types. 
Built on a fine-tuned 7B vision-language model, olmOCR provides enterprise-grade PDF processing at a fra...","status":"active","model_type":"chat","context_window":16384,"open_weight":true,"capabilities":{"structured_output":true,"json_mode":true,"vision":true,"streaming":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":0.09,"output":0.19},"endpoints":["chat_completions"],"quantization":"fp8","tagline":"olmOCR is a specialized AI tool that converts PDF documents into clean, structured text while preserving important formatting and layout information."},{"id":"anthropic/claude-3-7-sonnet-latest","name":"claude-3-7-sonnet-latest","created_by":"anthropic","source":"official","last_updated":"2026-04-26","family":"claude-sonnet","status":"active","model_type":"chat","context_window":200000,"open_weight":false,"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"vision":true,"streaming":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":3.3,"output":16.5,"cached_input":0.33},"tools":["function_calling"],"endpoints":["chat_completions"]},{"id":"anthropic/claude-4-opus","name":"claude-4-opus","created_by":"anthropic","source":"official","last_updated":"2026-04-26","family":"claude-opus","description":"Anthropic’s most powerful model yet and the state-of-the-art coding model. It delivers sustained performance on long-running tasks that require focused effort and thousands of steps, significantly expanding what AI agents can solve. 
Claude Opus 4 is ideal for powering frontier agent products and features.","status":"active","model_type":"chat","context_window":200000,"open_weight":false,"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"vision":true,"streaming":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":16.5,"output":82.5},"tools":["function_calling"],"endpoints":["chat_completions"],"tagline":"Anthropic’s most powerful model yet and the state-of-the-art coding model."},{"id":"anthropic/claude-4-sonnet","name":"claude-4-sonnet","created_by":"anthropic","source":"official","last_updated":"2026-04-26","family":"claude-sonnet","description":"Anthropic's mid-size model with superior intelligence for high-volume uses in coding, in-depth research, agents, & more.","status":"active","model_type":"chat","context_window":200000,"open_weight":false,"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"vision":true,"streaming":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":3.3,"output":16.5},"tools":["function_calling"],"endpoints":["chat_completions"],"tagline":"Anthropic's mid-size model with superior intelligence for high-volume uses in coding, in-depth research, agents, & more."},{"id":"anthropic/claude-haiku-4-5","name":"claude-haiku-4-5","created_by":"anthropic","source":"official","family":"claude-haiku","description":"The next generation of Anthropic's fastest and most cost-effective model, optimal for use cases where speed and affordability matter.","status":"active","context_window":200000,"model_type":"chat","reasoning_tokens":true,"open_weight":false,"tagline":"The next generation of Anthropic's fastest and most cost-effective model, optimal for use cases where speed and affordability 
matter.","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"reasoning":true,"vision":true,"streaming":true,"batch":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":1,"output":5},"tools":["function_calling"],"endpoints":["chat_completions"],"last_updated":"2026-06-03","max_output_tokens":64000,"knowledge_cutoff":"2025-02","training_data_cutoff":"2025-07","license":"proprietary"},{"id":"anthropic/claude-opus-4-7","name":"claude-opus-4-7","created_by":"anthropic","source":"official","family":"claude-opus","description":"Anthropic's most capable production model yet, advancing performance across coding, enterprise workflows, and long-running agentic tasks.","status":"active","context_window":1000000,"model_type":"chat","reasoning_tokens":true,"open_weight":false,"tagline":"Anthropic's most capable production model yet, advancing performance across coding, enterprise workflows, and long-running agentic tasks.","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"reasoning":true,"vision":true,"streaming":true,"batch":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":5,"output":25},"tools":["function_calling"],"endpoints":["chat_completions"],"last_updated":"2026-06-03","max_output_tokens":128000,"knowledge_cutoff":"2026-01","training_data_cutoff":"2026-01","license":"proprietary"},{"id":"anthropic/claude-opus-4-8","name":"claude-opus-4-8","created_by":"anthropic","source":"official","family":"claude-opus","description":"Claude Opus 4.8 is our most intelligent Opus model and the best generally available model for coding and agents, with deeper reasoning for enterprise workflows.","status":"active","context_window":1000000,"model_type":"chat","reasoning_tokens":true,"open_weight":false,"tagline":"Claude Opus 4.8 is our most intelligent Opus model and the best generally available model for coding and agents, with deeper reasoning for enterprise 
workflows.","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"reasoning":true,"vision":true,"streaming":true,"batch":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":5,"output":25},"tools":["function_calling"],"endpoints":["chat_completions"],"last_updated":"2026-06-03","max_output_tokens":128000,"knowledge_cutoff":"2026-01","training_data_cutoff":"2026-01","license":"proprietary"},{"id":"anthropic/claude-sonnet-4-6","name":"claude-sonnet-4-6","created_by":"anthropic","source":"official","family":"claude-sonnet","description":"Claude Sonnet 4.6 delivers frontier intelligence at scale—built for coding, agents, and enterprise workflows.","status":"active","context_window":1000000,"model_type":"chat","reasoning_tokens":true,"open_weight":false,"tagline":"Claude Sonnet 4.6 delivers frontier intelligence at scale—built for coding, agents, and enterprise workflows.","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"reasoning":true,"vision":true,"streaming":true,"batch":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":3,"output":15},"tools":["function_calling"],"endpoints":["chat_completions"],"last_updated":"2026-06-03","max_output_tokens":64000,"knowledge_cutoff":"2025-08","training_data_cutoff":"2026-01","license":"proprietary"},{"id":"BAAI/bge-base-en-v1.5","name":"bge-base-en-v1.5","created_by":"baai","source":"official","last_updated":"2026-04-26","family":"bge","description":"BGE embedding is a general Embedding Model. It is pre-trained using retromae and trained on large-scale pair data using contrastive learning. 
Note that the goal of pre-training is to reconstruct the text, and the pre-trained model cannot be used for similarity calculation directly, it needs to be fine-tuned","status":"active","model_type":"embed","open_weight":true,"license":"mit","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["embeddings"],"tagline":"BGE embedding is a general Embedding Model."},{"id":"BAAI/bge-en-icl","name":"bge-en-icl","created_by":"baai","source":"official","last_updated":"2026-04-26","family":"bge","description":"A LLM-based embedding model with in-context learning capabilities that achieves SOTA performance on BEIR and AIR-Bench. It leverages few-shot examples to enhance task performance.","status":"active","model_type":"embed","open_weight":true,"license":"mit","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["embeddings"],"tagline":"A LLM-based embedding model with in-context learning capabilities that achieves SOTA performance on BEIR and AIR-Bench."},{"id":"BAAI/bge-large-en-v1.5","name":"bge-large-en-v1.5","created_by":"baai","source":"official","last_updated":"2026-04-26","family":"bge","description":"BGE embedding is a general Embedding Model. It is pre-trained using retromae and trained on large-scale pair data using contrastive learning. 
Note that the goal of pre-training is to reconstruct the text, and the pre-trained model cannot be used for similarity calculation directly, it needs to be fine-tuned","status":"active","model_type":"embed","open_weight":true,"license":"mit","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["embeddings"],"tagline":"BGE embedding is a general Embedding Model."},{"id":"BAAI/bge-m3-multi","name":"bge-m3-multi","created_by":"baai","source":"official","last_updated":"2026-04-26","family":"bge","description":"BGE-M3 is a multilingual text embedding model developed by BAAI, distinguished by its Multi-Linguality (supporting 100+ languages), Multi-Functionality (unified dense, multi-vector, and sparse retrieval), and Multi-Granularity (handling inputs from short queries to 8192-token documents). It achieves state-of-the-art retrieval performance across diverse benchmarks while maintaining a single model for multiple retrieval modes.","status":"active","model_type":"embed","open_weight":true,"license":"mit","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["embeddings"],"tagline":"BGE-M3 is a multilingual text embedding model developed by BAAI, distinguished by its Multi-Linguality (supporting 100+ languages), Multi-Functionality (unified dense, multi-vector, and sparse retrieval), and Multi-Granularity (handling inputs from short queries to 8192-token documents)."},{"id":"BAAI/bge-m3","name":"bge-m3","created_by":"baai","source":"official","last_updated":"2026-04-26","family":"bge","description":"BGE-M3 is a versatile text embedding model that supports multi-functionality, multi-linguality, and multi-granularity, allowing it to perform dense retrieval, multi-vector retrieval, and sparse retrieval in over 100 languages and with input sizes up to 8192 tokens. 
The model can be used in a retrieval pipeline with hybrid retrieval and re-ranking to achieve higher accuracy and stronger generalization capabilities. BGE-M3 has shown state-of-the-art performance on several benchmarks, including ...","status":"active","model_type":"embed","open_weight":true,"license":"mit","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["embeddings"],"quantization":"fp32","tagline":"BGE-M3 is a versatile text embedding model that supports multi-functionality, multi-linguality, and multi-granularity, allowing it to perform dense retrieval, multi-vector retrieval, and sparse retrieval in over 100 languages and with input sizes up to 8192 tokens."},{"id":"black-forest-labs/FLUX-1-dev","name":"FLUX-1-dev","created_by":"black-forest-labs","source":"official","last_updated":"2026-04-26","family":"flux","description":"FLUX.1-dev is a state-of-the-art 12 billion parameter rectified flow transformer developed by Black Forest Labs. This model excels in text-to-image generation, providing highly accurate and detailed outputs. It is particularly well-regarded for its ability to follow complex prompts and generate anatomically accurate images, especially with challenging details like hands and faces.","status":"active","model_type":"image","open_weight":true,"license":"flux","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"pricing_notes":["$0.0090 per image unit (1024x1024 default)"],"tagline":"FLUX.1-dev is a state-of-the-art 12 billion parameter rectified flow transformer developed by Black Forest Labs."},{"id":"black-forest-labs/FLUX-1-Redux-dev","name":"FLUX-1-Redux-dev","created_by":"black-forest-labs","source":"official","last_updated":"2026-04-26","family":"flux","description":"FLUX.1 Redux [dev] is an image variation generation adapter for all FLUX.1 base models. 
It enables users to refine images with slight variations and supports text-based restyling via API. Integrated with FLUX1.1 [pro] Ultra, it allows for high-quality 4-megapixel outputs. The model can be used with Diffusers in Python for efficient image generation. While powerful, it has ethical and factual limitations and is governed by a non-commercial license.","status":"active","model_type":"image","open_weight":true,"license":"flux","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"pricing_notes":["$0.0120 per image unit (1024x1024 default)"],"tagline":"FLUX.1 Redux [dev] is an image variation generation adapter for all FLUX.1 base models."},{"id":"black-forest-labs/FLUX-1-schnell","name":"FLUX-1-schnell","created_by":"black-forest-labs","source":"official","last_updated":"2026-04-26","family":"flux","description":"FLUX.1 [schnell] is a 12 billion parameter rectified flow transformer capable of generating images from text descriptions. This model offers cutting-edge output quality and competitive prompt following, matching the performance of closed source alternatives. 
Trained using latent adversarial diffusion distillation, FLUX.1 [schnell] can generate high-quality images in only 1 to 4 steps.","status":"active","model_type":"image","open_weight":true,"license":"flux","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"pricing_notes":["$0.0005 per image unit (1024x1024 default)"],"tagline":"FLUX.1 [schnell] is a 12 billion parameter rectified flow transformer capable of generating images from text descriptions."},{"id":"black-forest-labs/FLUX-1.1-pro","name":"FLUX-1.1-pro","created_by":"black-forest-labs","source":"official","last_updated":"2026-04-26","family":"flux","description":"Black Forest Labs' latest state-of-the art proprietary model sporting top of the line prompt following, visual quality, details and output diversity.","status":"active","model_type":"image","open_weight":false,"license":"flux","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"pricing_notes":["$0.0400 per image unit (0x0 default)"],"tagline":"Black Forest Labs' latest state-of-the art proprietary model sporting top of the line prompt following, visual quality, details and output diversity."},{"id":"black-forest-labs/FLUX-2-dev","name":"FLUX-2-dev","created_by":"black-forest-labs","source":"official","last_updated":"2026-04-26","family":"flux-2","description":"Brand-new Flux2 Dev introduces a faster, more modular architecture for next-generation image generation pipelines. 
It delivers improved performance, cleaner control APIs, and a significantly more flexible development workflow for custom inference setups.","status":"active","model_type":"image","open_weight":true,"license":"flux","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"pricing_notes":["$0.0100 per image unit (1024x1024 default)"],"tagline":"Brand-new Flux2 Dev introduces a faster, more modular architecture for next-generation image generation pipelines."},{"id":"black-forest-labs/FLUX-2-klein-4b","name":"FLUX-2-klein-4b","created_by":"black-forest-labs","source":"official","last_updated":"2026-04-26","family":"flux-2","description":"The fastest model of the Flux 2 family. Frontier visual intelligence — state-of-the-art image generation and editing from Black Forest Labs","status":"active","model_type":"image","open_weight":true,"license":"flux","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"pricing_notes":["$0.0140 per image unit (1024x1024 default)"],"tagline":"The fastest model of the Flux 2 family."},{"id":"black-forest-labs/FLUX-2-klein-9b","name":"FLUX-2-klein-9b","created_by":"black-forest-labs","source":"official","last_updated":"2026-04-26","family":"flux-2","description":"The best quality-to-latency ratio, production apps model of the Flux 2 family. 
Frontier visual intelligence — state-of-the-art image generation and editing from Black Forest Labs","status":"active","model_type":"image","open_weight":true,"license":"flux","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"pricing_notes":["$0.0150 per image unit (1024x1024 default)"],"tagline":"The best quality-to-latency ratio, production apps model of the Flux 2 family."},{"id":"black-forest-labs/FLUX-2-max","name":"FLUX-2-max","created_by":"black-forest-labs","source":"official","last_updated":"2026-04-26","family":"flux-2","description":"The new top-tier image model from Black Forest Labs, significantly pushing image quality and editing consistency","status":"active","model_type":"image","open_weight":false,"license":"flux","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"pricing_notes":["$0.1000 per image unit (0x0 default)"],"tagline":"The new top-tier image model from Black Forest Labs, significantly pushing image quality and editing consistency"},{"id":"black-forest-labs/FLUX-2-pro","name":"FLUX-2-pro","created_by":"black-forest-labs","source":"official","last_updated":"2026-04-26","family":"flux-2","description":"Multi-reference visual intelligence with unprecedented detail, color precision, and spatial reasoning. The most advanced image generation and editing model. 
Generate photorealistic images with precise control.","status":"active","model_type":"image","open_weight":false,"license":"flux","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"pricing_notes":["$0.0150 per image unit (0x0 default)"],"tagline":"Multi-reference visual intelligence with unprecedented detail, color precision, and spatial reasoning."},{"id":"black-forest-labs/FLUX-pro","name":"FLUX-pro","created_by":"black-forest-labs","source":"official","last_updated":"2026-04-26","family":"flux","description":"Black Forest Labs' first flagship model based on Flux latent rectified flow transformers","status":"active","model_type":"image","open_weight":false,"license":"flux","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"pricing_notes":["$0.0500 per image unit (0x0 default)"],"tagline":"Black Forest Labs' first flagship model based on Flux latent rectified flow transformers"},{"id":"black-forest-labs/FLUX.1-Kontext-dev","name":"FLUX.1-Kontext-dev","created_by":"black-forest-labs","source":"official","last_updated":"2026-04-26","family":"flux","description":"FLUX.1 Kontext [dev] is a 12-billion-parameter image editing model that transforms visuals based on natural language instructions. 
It allows highly consistent, multi-step edits and is released with open weights under a non-commercial license to empower artists and researchers.","status":"active","model_type":"image","open_weight":true,"license":"flux","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"pricing_notes":["$0.0100 per image unit (1024x1024 default)"],"tagline":"FLUX.1 Kontext [dev] is a 12-billion-parameter image editing model that transforms visuals based on natural language instructions."},{"id":"bosonai/HiggsAudioV2.5","name":"HiggsAudioV2.5","created_by":"bosonai","source":"official","last_updated":"2026-04-26","family":"bosonai","description":"HiggsAudioV2.5 is a high-quality neural text-to-speech (TTS) model designed for natural-sounding voice generation across a wide range of use cases. It focuses on clarity, stable prosody, and consistent pacing, making it suitable for both short prompts and longer narration.","status":"active","model_type":"tts","open_weight":true,"capabilities":{"streaming":true},"modalities":{"input":["text"],"output":["audio"]},"endpoints":["audio_speech"],"pricing_notes":["$20.0000 per 1M input characters"],"tagline":"HiggsAudioV2.5 is a high-quality neural text-to-speech (TTS) model designed for natural-sounding voice generation across a wide range of use cases."},{"id":"Bria/blur_background","name":"blur_background","created_by":"bria","source":"official","last_updated":"2026-04-26","family":"bria","description":"Bria Blur Background softens and de-emphasizes image backgrounds while keeping the subject sharp and clear for professional-quality results. 
Trained fully on licensed data, it delivers safe, natural, and commercial-ready outputs.","status":"active","model_type":"image","open_weight":false,"capabilities":{"streaming":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"pricing_notes":["$0.0400 per image unit (0x0 default)"],"tagline":"Bria Blur Background softens and de-emphasizes image backgrounds while keeping the subject sharp and clear for professional-quality results."},{"id":"Bria/Bria-3.2-vector","name":"Bria-3.2-vector","created_by":"bria","source":"official","last_updated":"2026-04-26","family":"bria","description":"Bria 3.2 is the next-generation commercial-ready text-to-image model. With just 4 billion parameters, it provides exceptional aesthetics and text rendering, evaluated to be on par to leading open-source models, and outperforming other licensed models.","status":"active","model_type":"image","open_weight":false,"capabilities":{"streaming":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"pricing_notes":["$0.0400 per image unit (0x0 default)"],"tagline":"Bria 3.2 is the next-generation commercial-ready text-to-image model."},{"id":"Bria/Bria-3.2","name":"Bria-3.2","created_by":"bria","source":"official","last_updated":"2026-04-26","family":"bria","description":"Bria 3.2 is the next-generation commercial-ready text-to-image model. 
With just 4 billion parameters, it provides exceptional aesthetics and text rendering, evaluated to be on par to leading open-source models, and outperforming other licensed models.","status":"active","model_type":"image","open_weight":false,"capabilities":{"streaming":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"pricing_notes":["$0.0400 per image unit (0x0 default)"],"tagline":"Bria 3.2 is the next-generation commercial-ready text-to-image model."},{"id":"Bria/enhance","name":"enhance","created_by":"bria","source":"official","last_updated":"2026-04-26","family":"bria","description":"Bria Enhance improves overall image quality by sharpening details, balancing colors, and boosting clarity for crisp, professional visuals. Trained only on licensed data, it’s safe, reliable, and ready for commercial use.","status":"active","model_type":"image","open_weight":false,"capabilities":{"streaming":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"pricing_notes":["$0.0400 per image unit (0x0 default)"],"tagline":"Bria Enhance improves overall image quality by sharpening details, balancing colors, and boosting clarity for crisp, professional visuals."},{"id":"Bria/erase","name":"erase","created_by":"bria","source":"official","last_updated":"2026-04-26","family":"bria","description":"Bria Eraser enables precise removal of unwanted objects from images while maintaining high-quality outputs. 
Trained exclusively on licensed data for safe and risk-free commercial use","status":"active","model_type":"image","open_weight":false,"capabilities":{"streaming":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"pricing_notes":["$0.0400 per image unit (0x0 default)"],"tagline":"Bria Eraser enables precise removal of unwanted objects from images while maintaining high-quality outputs."},{"id":"Bria/erase_foreground","name":"erase_foreground","created_by":"bria","source":"official","last_updated":"2026-04-26","family":"bria","description":"Bria Erase Foreground precisely removes main subjects or foreground objects from images. Built entirely on licensed data, it is safe and optimized for professional and commercial use.","status":"active","model_type":"image","open_weight":false,"capabilities":{"streaming":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"pricing_notes":["$0.0400 per image unit (0x0 default)"],"tagline":"Bria Erase Foreground precisely removes main subjects or foreground objects from images."},{"id":"Bria/expand","name":"expand","created_by":"bria","source":"official","last_updated":"2026-04-26","family":"bria","description":"Bria Expand expands images beyond their borders in high quality. Resizing the image by generating new pixels to expand to the desired aspect ratio. 
Trained exclusively on licensed data for safe and risk-free commercial use.","status":"active","model_type":"image","open_weight":false,"capabilities":{"streaming":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"pricing_notes":["$0.0400 per image unit (0x0 default)"],"tagline":"Bria Expand expands images beyond their borders in high quality."},{"id":"Bria/fibo","name":"fibo","created_by":"bria","source":"official","last_updated":"2026-04-26","family":"bria","description":"FIBO is an open-source, JSON-native text-to-image model trained on detailed structured descriptions (over 1,000+ words per image), providing fine-grained control over light, composition, and camera parameters.","status":"active","model_type":"image","open_weight":false,"capabilities":{"streaming":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"pricing_notes":["$0.0400 per image unit (0x0 default)"],"tagline":"FIBO is an open-source, JSON-native text-to-image model trained on detailed structured descriptions (over 1,000+ words per image), providing fine-grained control over light, composition, and camera pa"},{"id":"Bria/fibo_edit","name":"fibo_edit","created_by":"bria","source":"official","last_updated":"2026-04-26","family":"bria","description":"🥳 For a limited time, Fibo Edit is free on DeepInfra 🥳 YOUR AI, YOUR RULES. Visual Generation for Production-Grade. FIBO Edit. 
An open-source image editing model with native masking and a lightweight 8B architecture.","status":"active","model_type":"image","open_weight":false,"capabilities":{"streaming":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"pricing_notes":["$0.0400 per image unit (0x0 default)"],"tagline":"🥳 For a limited time, Fibo Edit is free on DeepInfra 🥳 YOUR AI, YOUR RULES."},{"id":"Bria/gen_fill","name":"gen_fill","created_by":"bria","source":"official","last_updated":"2026-04-26","family":"bria","description":"Bria GenFill enables high-quality object addition or visual transformation. Trained exclusively on licensed data for safe and risk-free commercial use.","status":"active","model_type":"image","open_weight":false,"capabilities":{"streaming":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"pricing_notes":["$0.0400 per image unit (0x0 default)"],"tagline":"Bria GenFill enables high-quality object addition or visual transformation."},{"id":"Bria/remove_background","name":"remove_background","created_by":"bria","source":"official","last_updated":"2026-04-26","family":"bria","description":"Bria RMBG 2.0 enables seamless removal of backgrounds from images, ideal for professional editing tasks. 
Trained exclusively on licensed data for safe and risk-free commercial use.","status":"active","model_type":"image","open_weight":false,"capabilities":{"streaming":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"pricing_notes":["$0.0180 per image unit (0x0 default)"],"tagline":"Bria RMBG 2.0 enables seamless removal of backgrounds from images, ideal for professional editing tasks."},{"id":"Bria/replace_background","name":"replace_background","created_by":"bria","source":"official","last_updated":"2026-04-26","family":"bria","description":"Bria Background Generation allows for efficient swapping of backgrounds in images via text prompts or reference image, delivering realistic and polished results. Trained exclusively on licensed data for safe and risk-free commercial use.","status":"active","model_type":"image","open_weight":false,"capabilities":{"streaming":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"pricing_notes":["$0.0400 per image unit (0x0 default)"],"tagline":"Bria Background Generation allows for efficient swapping of backgrounds in images via text prompts or reference image, delivering realistic and polished results."},{"id":"Bria/video_eraser","name":"video_eraser","created_by":"bria","source":"official","last_updated":"2026-04-26","family":"bria","description":"Remove unwanted objects or regions from video using a mask, reconstructs the background with intelligent content-aware fill.","status":"active","model_type":"video","open_weight":false,"modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"tagline":"Remove unwanted objects or regions from video using a mask, reconstructs the background with intelligent content-aware fill."},{"id":"Bria/video_foreground_mask","name":"video_foreground_mask","created_by":"bria","source":"official","last_updated":"2026-04-26","family":"bria","description":"Automatically identify and segment foreground objects across video frames 
and generate a mask. No prompts, just a video.","status":"active","model_type":"video","open_weight":false,"modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"tagline":"Automatically identify and segment foreground objects across video frames and generate a mask."},{"id":"Bria/video_increase_resolution","name":"video_increase_resolution","created_by":"bria","source":"official","last_updated":"2026-04-26","family":"bria","description":"Increase video resolution up to 8K with advanced AI upscaling. Bring your videos to the big screen, ready for the screens of tomorrow.","status":"active","model_type":"video","open_weight":false,"modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"tagline":"Increase video resolution up to 8K with advanced AI upscaling."},{"id":"Bria/video_mask_by_key_points","name":"video_mask_by_key_points","created_by":"bria","source":"official","last_updated":"2026-04-26","family":"bria","description":"Identify and segment objects across video frames using specific coordinate points. Just point in the right direction and the model will figure out by itself which object should be masked.","status":"active","model_type":"video","open_weight":false,"modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"tagline":"Identify and segment objects across video frames using specific coordinate points."},{"id":"Bria/video_mask_by_prompt","name":"video_mask_by_prompt","created_by":"bria","source":"official","last_updated":"2026-04-26","family":"bria","description":"Identify and segment objects across video frames using a text prompt. 
The easiest way to create a mask to modify your videos.","status":"active","model_type":"video","open_weight":false,"modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"tagline":"Identify and segment objects across video frames using a text prompt."},{"id":"Bria/video_remove_background","name":"video_remove_background","created_by":"bria","source":"official","last_updated":"2026-04-26","family":"bria","description":"Light and fast. Remove the background of your videos to bring the foreground elements to focus. No more unwanted distractions.","status":"active","model_type":"video","open_weight":false,"modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"tagline":"Light and fast."},{"id":"ByteDance/Seed-1.8","name":"Seed-1.8","created_by":"bytedance","source":"official","last_updated":"2026-04-26","family":"bytedance","description":"Optimized specifically for multimodal agent scenarios. It features enhanced agent capabilities, upgraded multimodal comprehension, and more flexible context management.","status":"active","model_type":"chat","context_window":256000,"reasoning_tokens":true,"open_weight":false,"license":"apache-2.0","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"reasoning":true,"vision":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":0.25,"output":2,"cached_input":0.05},"tools":["function_calling"],"endpoints":["chat_completions"],"tagline":"Optimized specifically for multimodal agent scenarios."},{"id":"ByteDance/Seed-2.0-code","name":"Seed-2.0-code","created_by":"bytedance","source":"official","description":"A coding model optimized for real-world development environments, with reliable tool use in common IDEs such as Claude Code. 
It delivers strong front-end performance and supports Skills.","status":"active","context_window":256000,"model_type":"chat","reasoning_tokens":true,"license":"apache-2.0","open_weight":false,"tagline":"A coding model optimized for real-world development environments, with reliable tool use in common IDEs such as Claude Code.","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"reasoning":true,"vision":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":0.5,"output":3,"cached_input":0.1},"tools":["function_calling"],"endpoints":["chat_completions"],"last_updated":"2026-06-03"},{"id":"ByteDance/Seed-2.0-mini","name":"Seed-2.0-mini","created_by":"bytedance","source":"official","last_updated":"2026-04-26","family":"seed","description":"Built for low-latency, high-concurrency, cost-sensitive use cases, with flexible deployment, four-tier thinking, and multimodal","status":"active","model_type":"chat","context_window":256000,"reasoning_tokens":true,"open_weight":false,"license":"apache-2.0","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"reasoning":true,"vision":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":0.1,"output":0.4,"cached_input":0.02},"tools":["function_calling"],"endpoints":["chat_completions"],"tagline":"Built for low-latency, high-concurrency, cost-sensitive use cases, with flexible deployment, four-tier thinking, and multimodal"},{"id":"ByteDance/Seed-2.0-pro","name":"Seed-2.0-pro","created_by":"bytedance","source":"official","last_updated":"2026-04-26","family":"seed","description":"Built for the Agent era, it delivers stable performance in complex reasoning and long-horizon tasks, including multi-step planning, visual-text reasoning, video understanding, and advanced 
analysis.","status":"active","model_type":"chat","context_window":256000,"reasoning_tokens":true,"open_weight":false,"license":"apache-2.0","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"reasoning":true,"vision":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":0.5,"output":3,"cached_input":0.1},"tools":["function_calling"],"endpoints":["chat_completions"],"tagline":"Built for the Agent era, it delivers stable performance in complex reasoning and long-horizon tasks, including multi-step planning, visual-text reasoning, video understanding, and advanced analysis."},{"id":"ByteDance/Seedance-1.5-Pro","name":"Seedance-1.5-Pro","created_by":"bytedance","source":"official","last_updated":"2026-04-26","family":"bytedance","description":"ByteDance's Seedance 1.5 Pro is a professional video model using V2A native generation for integrated, synced audio-visual output, enhancing efficiency of professional video creation.","status":"active","model_type":"video","open_weight":false,"license":"apache-2.0","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"tagline":"ByteDance's Seedance 1.5 Pro is a professional video model using V2A native generation for integrated, synced audio-visual output, enhancing efficiency of professional video creation."},{"id":"ByteDance/Seedance-2.0","name":"Seedance-2.0","created_by":"bytedance","source":"official","description":"A new-generation professional-grade multimodal video creation model developed, supports video generation with multimodal reference inputs including images, videos and audio.","status":"active","model_type":"video","license":"apache-2.0","open_weight":false,"tagline":"A new-generation professional-grade multimodal video creation model developed, supports video generation with multimodal reference inputs including images, videos and 
audio.","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_updated":"2026-06-03","capabilities":{"vision":true,"fine_tuning":true}},{"id":"ByteDance/Seedream-4.5","name":"Seedream-4.5","created_by":"bytedance","source":"official","last_updated":"2026-04-26","family":"bytedance","description":"The latest image model, delivering better editing consistency, improved multi-image fusion, finer detail control, natural small text and faces, and harmonious, aesthetic visuals.","status":"active","model_type":"image","open_weight":false,"license":"apache-2.0","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"pricing_notes":["$0.0400 per image unit (0x0 default)"],"tagline":"The latest image model, delivering better editing consistency, improved multi-image fusion, finer detail control, natural small text and faces, and harmonious, aesthetic visuals."},{"id":"ByteDance/Seedream-4","name":"Seedream-4","created_by":"bytedance","source":"official","last_updated":"2026-04-26","family":"bytedance","description":"Seedream 4.0 is a SOTA multimodal image creation model built on leading architecture. It breaks through the boundaries of traditional text-to-image models by natively supporting text, single-image, and multi-image inputs. 
Users can freely combine text and images to achieve diverse creative modes within a single model—such as multi-image blending, image editing, and sequentially batch image generation, featuring subject consistency, making image creation more free and controllable.","status":"active","model_type":"image","open_weight":false,"license":"apache-2.0","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"pricing_notes":["$0.0400 per image unit (0x0 default)"],"tagline":"Seedream 4.0 is a SOTA multimodal image creation model built on leading architecture."},{"id":"canopylabs/orpheus-3b-0.1-ft","name":"orpheus-3b-0.1-ft","created_by":"canopylabs","source":"official","last_updated":"2026-04-26","family":"canopylabs","description":"Orpheus TTS is a state-of-the-art, Llama-based Speech-LLM designed for high-quality, empathetic text-to-speech generation. This model has been finetuned to deliver human-level speech synthesis, achieving exceptional clarity, expressiveness, and real-time streaming performances.","status":"active","model_type":"tts","open_weight":true,"capabilities":{"streaming":true},"modalities":{"input":["text"],"output":["audio"]},"endpoints":["audio_speech"],"pricing_notes":["$7.0000 per 1M input characters"],"tagline":"Orpheus TTS is a state-of-the-art, Llama-based Speech-LLM designed for high-quality, empathetic text-to-speech generation."},{"id":"ClarityAI/creative","name":"creative","created_by":"clarityai","source":"official","last_updated":"2026-04-26","family":"clarityai","description":"ClarityAI/creative is an AI-powered image upscaler that enhances details, adds realism, and creatively modifies images to improve their quality and visual appeal.","status":"active","model_type":"image","open_weight":false,"capabilities":{"streaming":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"pricing_notes":["$0.0500 per image unit (0x0 
default)"],"tagline":"ClarityAI/creative is an AI-powered image upscaler that enhances details, adds realism, and creatively modifies images to improve their quality and visual appeal."},{"id":"ClarityAI/crystal","name":"crystal","created_by":"clarityai","source":"official","last_updated":"2026-04-26","family":"clarityai","description":"ClarityAI/crystal is a specialized upscaler optimized for portraits, faces, and products, delivering high-precision enhancements with adjustable detail levels for sharp, natural results.","status":"active","model_type":"image","open_weight":false,"capabilities":{"streaming":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"pricing_notes":["$0.0500 per image unit (0x0 default)"],"tagline":"ClarityAI/crystal is a specialized upscaler optimized for portraits, faces, and products, delivering high-precision enhancements with adjustable detail levels for sharp, natural results."},{"id":"ClarityAI/flux","name":"flux","created_by":"clarityai","source":"official","last_updated":"2026-04-26","family":"flux","description":"ClarityAI/flux integrates the Flux AI model into the upscaling process, enabling high-resolution enhancements with superior face preservation and support for LoRAs to apply specific styles or identities.","status":"active","model_type":"image","open_weight":false,"capabilities":{"streaming":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"pricing_notes":["$0.2000 per image unit (0x0 default)"],"tagline":"ClarityAI/flux integrates the Flux AI model into the upscaling process, enabling high-resolution enhancements with superior face preservation and support for LoRAs to apply specific styles or 
identiti"},{"id":"deepreinforce-ai/Ornith-1.0-35B","name":"Ornith-1.0-35B","created_by":"deepreinforce-ai","source":"official","status":"active","context_window":262144,"model_type":"chat","reasoning_tokens":true,"open_weight":true,"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"reasoning":true,"vision":true,"streaming":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":0.14,"output":1,"cached_input":0.05},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"fp8","last_updated":"2026-06-29"},{"id":"deepseek-ai/DeepSeek-R1-0528-Turbo","name":"DeepSeek-R1-0528-Turbo","created_by":"deepseek","source":"official","last_updated":"2026-04-26","family":"deepseek-r1","description":"The DeepSeek R1 0528 turbo model is a state of the art reasoning model that can generate very quick responses","status":"active","model_type":"chat","context_window":32768,"open_weight":true,"license":"deepseek","capabilities":{"tool_call":true,"json_mode":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":1,"output":3},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"fp4","tagline":"The DeepSeek R1 0528 turbo model is a state of the art reasoning model that can generate very quick responses"},{"id":"deepseek-ai/DeepSeek-R1-0528","name":"DeepSeek-R1-0528","created_by":"deepseek","source":"official","last_updated":"2026-04-26","family":"deepseek-r1","description":"The DeepSeek R1 model has undergone a minor version upgrade, with the current version being 
DeepSeek-R1-0528.","status":"active","model_type":"chat","context_window":163840,"open_weight":true,"license":"deepseek","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.5,"output":2.15,"cached_input":0.35},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"fp4","tagline":"The DeepSeek R1 model has undergone a minor version upgrade, with the current version being DeepSeek-R1-0528."},{"id":"deepseek-ai/DeepSeek-R1-Distill-Llama-70B","name":"DeepSeek-R1-Distill-Llama-70B","created_by":"deepseek","source":"official","last_updated":"2026-04-26","family":"llama","description":"DeepSeek-R1-Distill-Llama-70B is a highly efficient language model that leverages knowledge distillation to achieve state-of-the-art performance. This model distills the reasoning patterns of larger models into a smaller, more agile architecture, resulting in exceptional results on benchmarks like AIME 2024, MATH-500, and LiveCodeBench. 
With 70 billion parameters, DeepSeek-R1-Distill-Llama-70B offers a unique balance of accuracy and efficiency, making it an ideal choice for a wide range of na...","status":"active","model_type":"chat","context_window":131072,"open_weight":true,"license":"deepseek","capabilities":{"json_mode":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.7,"output":0.8},"endpoints":["chat_completions"],"quantization":"fp8","tagline":"DeepSeek-R1-Distill-Llama-70B is a highly efficient language model that leverages knowledge distillation to achieve state-of-the-art performance."},{"id":"deepseek-ai/DeepSeek-V3-0324","name":"DeepSeek-V3-0324","created_by":"deepseek","source":"official","last_updated":"2026-04-26","family":"deepseek-v3","description":"DeepSeek-V3-0324, a strong Mixture-of-Experts (MoE) language model with 671B total parameters with 37B activated for each token, an improved iteration over DeepSeek-V3.","status":"active","model_type":"chat","context_window":163840,"open_weight":true,"license":"deepseek","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.2,"output":0.77,"cached_input":0.135},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"fp4","tagline":"DeepSeek-V3-0324, a strong Mixture-of-Experts (MoE) language model with 671B total parameters with 37B activated for each token, an improved iteration over DeepSeek-V3."},{"id":"deepseek-ai/DeepSeek-V3.1-Terminus","name":"DeepSeek-V3.1-Terminus","created_by":"deepseek","source":"official","last_updated":"2026-06-03","family":"deepseek-v3","description":"DeepSeek-V3.1 Terminus is an update to DeepSeek V3.1 that maintains the model's original capabilities while addressing issues reported by users, including language consistency and agent capabilities, further optimizing the model's performance in 
coding and search agents. It is a large hybrid reasoning model (671B parameters, 37B active) that supports both thinking and non-thinking modes. It extends the DeepSeek-V3 base with a two-phase long-context training process. Users can control the reas...","status":"active","model_type":"chat","context_window":163840,"open_weight":true,"license":"deepseek","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.27,"output":0.95,"cached_input":0.13},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"fp4","tagline":"DeepSeek-V3.1 Terminus is an update to DeepSeek V3.1 that maintains the model's original capabilities while addressing issues reported by users, including language consistency and agent capabilities, further optimizing the model's performance in coding and search agents."},{"id":"deepseek-ai/DeepSeek-V3.1","name":"DeepSeek-V3.1","created_by":"deepseek","source":"official","last_updated":"2026-04-26","family":"deepseek-v3","description":"DeepSeek-V3.1 is post-trained on the top of DeepSeek-V3.1-Base, which is built upon the original V3 base checkpoint through a two-phase long context extension approach, following the methodology outlined in the original DeepSeek-V3 report. We have expanded our dataset by collecting additional long documents and substantially extending both training phases. 
The 32K extension phase has been increased 10-fold to 630B tokens, while the 128K extension phase has been extended by 3.3x to 209B tokens...","status":"active","model_type":"chat","context_window":163840,"open_weight":true,"license":"deepseek","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.21,"output":0.79,"cached_input":0.13},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"fp4","tagline":"DeepSeek-V3.1 is post-trained on the top of DeepSeek-V3.1-Base, which is built upon the original V3 base checkpoint through a two-phase long context extension approach, following the methodology outlined in the original DeepSeek-V3 report."},{"id":"deepseek-ai/DeepSeek-V3.2","name":"DeepSeek-V3.2","created_by":"deepseek","source":"official","last_updated":"2026-04-26","family":"deepseek-v3","description":"DeepSeek-V3.2 is a large language model designed to harmonize high computational efficiency with strong reasoning and agentic tool-use performance. It introduces DeepSeek Sparse Attention (DSA), a fine-grained sparse attention mechanism that reduces training and inference cost while preserving quality in long-context scenarios. 
A scalable reinforcement learning post-training framework further improves reasoning, with reported performance in the GPT-5 class, and the model has demonstrated gold...","status":"active","model_type":"chat","context_window":163840,"open_weight":true,"license":"deepseek","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.26,"output":0.38,"cached_input":0.13},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"fp4","tagline":"DeepSeek-V3.2 is a large language model designed to harmonize high computational efficiency with strong reasoning and agentic tool-use performance."},{"id":"deepseek-ai/DeepSeek-V3","name":"DeepSeek-V3","created_by":"deepseek","source":"official","last_updated":"2026-04-26","family":"deepseek-v3","description":"DeepSeek-V3, a strong Mixture-of-Experts (MoE) language model with 671B total parameters with 37B activated for each token. 
To achieve efficient inference and cost-effective training, DeepSeek-V3 adopts Multi-head Latent Attention (MLA) and DeepSeekMoE architectures, which were thoroughly validated in DeepSeek-V2.","status":"active","model_type":"chat","context_window":163840,"open_weight":true,"license":"deepseek","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.32,"output":0.89},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"fp4","tagline":"DeepSeek-V3, a strong Mixture-of-Experts (MoE) language model with 671B total parameters with 37B activated for each token."},{"id":"deepseek-ai/DeepSeek-V4-Flash","name":"DeepSeek-V4-Flash","created_by":"deepseek","source":"official","last_updated":"2026-06-03","family":"deepseek-v4","description":"DeepSeek V4 Flash is an efficiency-focused MoE model with 284B total parameters (13B active) and a 1M-token context window. 
It's tuned for fast inference and high-throughput use cases while still holding up on reasoning and coding tasks.","status":"active","model_type":"chat","context_window":1048576,"open_weight":true,"license":"deepseek","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"fine_tuning":true,"reasoning":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.1,"output":0.2,"cached_input":0.02},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"fp4","tagline":"DeepSeek V4 Flash is an efficiency-focused MoE model with 284B total parameters (13B active) and a 1M-token context window.","reasoning_tokens":true,"max_output_tokens":384000},{"id":"deepseek-ai/DeepSeek-V4-Pro","name":"DeepSeek-V4-Pro","created_by":"deepseek","source":"official","last_updated":"2026-06-03","family":"deepseek-v4","description":"DeepSeek V4 Pro is an MoE model with 1.6T total parameters (49B active) and a 1M-token context window. It's built for advanced reasoning, coding, and long-running agent tasks, and performs well on knowledge, math, and software engineering benchmarks.","status":"active","model_type":"chat","context_window":1048576,"open_weight":true,"license":"deepseek","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"fine_tuning":true,"reasoning":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":1.3,"output":2.6,"cached_input":0.1},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"fp4","tagline":"DeepSeek V4 Pro is an MoE model with 1.6T total parameters (49B active) and a 1M-token context window.","max_output_tokens":384000},{"id":"deepseek-ai/Janus-Pro-1B","name":"Janus-Pro-1B","created_by":"deepseek","source":"official","last_updated":"2026-04-26","family":"deepseek-ai","description":"Janus-Pro is a novel autoregressive framework that unifies multimodal understanding and generation. 
It addresses the limitations of previous approaches by decoupling visual encoding into separate pathways, while still utilizing a single, unified transformer architecture for processing. The decoupling not only alleviates the conflict between the visual encoder’s roles in understanding and generation, but also enhances the framework’s flexibility. Janus-Pro surpasses previous unified model and ...","status":"active","model_type":"image","open_weight":true,"license":"deepseek","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"pricing_notes":["$0.0005 per image unit (0x0 default)"],"tagline":"Janus-Pro is a novel autoregressive framework that unifies multimodal understanding and generation."},{"id":"deepseek-ai/Janus-Pro-7B","name":"Janus-Pro-7B","created_by":"deepseek","source":"official","last_updated":"2026-04-26","family":"deepseek-ai","description":"Janus-Pro is a novel autoregressive framework that unifies multimodal understanding and generation. It addresses the limitations of previous approaches by decoupling visual encoding into separate pathways, while still utilizing a single, unified transformer architecture for processing. The decoupling not only alleviates the conflict between the visual encoder’s roles in understanding and generation, but also enhances the framework’s flexibility. 
Janus-Pro surpasses previous unified model and ...","status":"active","model_type":"image","open_weight":true,"license":"deepseek","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"pricing_notes":["$0.0020 per image unit (0x0 default)"],"tagline":"Janus-Pro is a novel autoregressive framework that unifies multimodal understanding and generation."},{"id":"FastVideo/LTX-2.3-Distilled-Diffusers","name":"LTX-2.3-Distilled-Diffusers","created_by":"fastvideo","source":"official","description":"A fast, step-distilled build of Lightricks' LTX-2.3 diffusion-transformer video model (distilled by FastVideo). Generates high-fidelity text-to-video and image-to-video in just a few denoising steps.","status":"active","model_type":"video","open_weight":true,"tagline":"A fast, step-distilled build of Lightricks' LTX-2.3 diffusion-transformer video model (distilled by FastVideo).","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_updated":"2026-06-29"},{"id":"FastVideo/LTX2-Distilled-Diffusers","name":"LTX2-Distilled-Diffusers","created_by":"fastvideo","source":"official","description":"LTX-2 is a DiT-based audio-video foundation model designed to generate synchronized video and audio within a single model. 
It brings together the core building blocks of modern video generation, with open weights and a focus on practical, local execution.","status":"active","model_type":"video","open_weight":true,"tagline":"LTX-2 is a DiT-based audio-video foundation model designed to generate synchronized video and audio within a single model.","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_updated":"2026-06-03"},{"id":"google/embeddinggemma-300m","name":"embeddinggemma-300m","created_by":"google","source":"official","last_updated":"2026-06-29","family":"embed","description":"EmbeddingGemma is a 300M parameter multilingual open embedding model from Google DeepMind, designed for efficient deployment even on low-resource devices, producing high-quality text vector representations for tasks such as search, classification, clustering, and semantic similarity.","status":"active","model_type":"embed","open_weight":true,"license":"gemma","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["embeddings"],"tagline":"ChatGPT said: EmbeddingGemma is a 300M parameter multilingual open embedding model from Google DeepMind, designed for efficient deployment even on low-resource devices, producing high-quality text vec"},{"id":"google/gemini-2.5-flash","name":"gemini-2.5-flash","created_by":"google","source":"official","last_updated":"2026-04-26","family":"gemini-2.5","description":"Gemini 2.5 Flash is Google's latest thinking model, designed to tackle increasingly complex problems. It's capable of reasoning through their thoughts before responding, resulting in enhanced performance and improved accuracy. 
Gemini 2.5 Flash: best for balancing reasoning and speed.","status":"active","model_type":"chat","context_window":1000000,"reasoning_tokens":true,"open_weight":false,"license":"gemma","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"reasoning":true,"vision":true,"streaming":true,"fine_tuning":true,"batch":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":0.3,"output":2.5},"tools":["function_calling"],"endpoints":["chat_completions"],"tagline":"Gemini 2.5 Flash is Google's latest thinking model, designed to tackle increasingly complex problems.","max_output_tokens":65536,"knowledge_cutoff":"2025-01"},{"id":"google/gemini-2.5-pro","name":"gemini-2.5-pro","created_by":"google","source":"official","last_updated":"2026-04-26","family":"gemini-2.5","description":"Gemini 2.5 Pro is Google's the most advanced thinking model, designed to tackle increasingly complex problems. Gemini 2.5 Pro leads common benchmarks by meaningful margins and showcases strong reasoning and code capabilities. Gemini 2.5 models are thinking models, capable of reasoning through their thoughts before responding, resulting in enhanced performance and improved accuracy. 
The Gemini 2.5 Pro model is now available on DeepInfra.","status":"active","model_type":"chat","context_window":1000000,"reasoning_tokens":true,"open_weight":false,"license":"gemma","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"reasoning":true,"vision":true,"streaming":true,"fine_tuning":true,"batch":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":1.25,"output":10},"tools":["function_calling"],"endpoints":["chat_completions"],"tagline":"Gemini 2.5 Pro is Google's the most advanced thinking model, designed to tackle increasingly complex problems.","max_output_tokens":65536,"knowledge_cutoff":"2025-01"},{"id":"google/gemini-3-pro-image","name":"gemini-3-pro-image","created_by":"google","source":"official","family":"gemini-3","description":"Nano Banana Pro (Gemini 3 Pro Image) is designed to tackle the most challenging image generation by incorporating state-of-the-art reasoning capabilities. It is the best model for complex and multi-turn image generation and editing.","status":"active","model_type":"image","license":"gemma","open_weight":false,"tagline":"Nano Banana Pro (Gemini 3 Pro Image) is designed to tackle the most challenging image generation by incorporating state-of-the-art reasoning capabilities.","capabilities":{"streaming":true,"fine_tuning":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_updated":"2026-06-03","context_window":65536,"max_output_tokens":32768,"knowledge_cutoff":"2025-01"},{"id":"google/gemini-3.1-flash-lite","name":"gemini-3.1-flash-lite","created_by":"google","source":"official","family":"gemini-3.1","description":"Bring any idea to life with state-of-the-art reasoning to help you learn, build, and plan anything. 
Best for high-volume tasks that need efficiency and intelligence.","status":"active","context_window":1000000,"model_type":"chat","reasoning_tokens":true,"license":"gemma","open_weight":false,"tagline":"Bring any idea to life with state-of-the-art reasoning to help you learn, build, and plan anything.","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"reasoning":true,"vision":true,"streaming":true,"fine_tuning":true,"batch":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":0.25,"output":1.5},"tools":["function_calling"],"endpoints":["chat_completions"],"last_updated":"2026-06-03","max_output_tokens":65536,"knowledge_cutoff":"2025-01"},{"id":"google/gemini-3.1-pro","name":"gemini-3.1-pro","created_by":"google","source":"official","family":"gemini-3.1","description":"Bring any idea to life with state-of-the-art reasoning to help you learn, build, and plan anything. Best for complex tasks and bringing creative concepts to life.","status":"active","context_window":1000000,"model_type":"chat","reasoning_tokens":true,"license":"gemma","open_weight":false,"tagline":"Bring any idea to life with state-of-the-art reasoning to help you learn, build, and plan anything.","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"reasoning":true,"vision":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":2,"output":12},"tools":["function_calling"],"endpoints":["chat_completions"],"last_updated":"2026-06-03"},{"id":"google/gemini-3.5-flash","name":"gemini-3.5-flash","created_by":"google","source":"official","family":"gemini-3.5","description":"Gemini 3.5 Flash delivers near-Pro intelligence at Flash-tier cost and speed: Pro-level coding proficiency, parallel agentic execution, all at a much lower 
price.","status":"active","context_window":1000000,"model_type":"chat","reasoning_tokens":true,"license":"gemma","open_weight":false,"tagline":"Gemini 3.5 Flash delivers near-Pro intelligence at Flash-tier cost and speed: Pro-level coding proficiency, parallel agentic execution, all at a much lower price.","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"reasoning":true,"vision":true,"streaming":true,"fine_tuning":true,"batch":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":1.5,"output":9},"tools":["function_calling"],"endpoints":["chat_completions"],"last_updated":"2026-06-03","max_output_tokens":65536,"knowledge_cutoff":"2025-01"},{"id":"google/gemma-3-12b-it","name":"gemma-3-12b-it","created_by":"google","source":"official","last_updated":"2026-06-10","family":"gemma-3","description":"Gemma 3 introduces multimodality, supporting vision-language input and text outputs. It handles context windows up to 128k tokens, understands over 140 languages, and offers improved math, reasoning, and chat capabilities, including structured outputs and function calling. Gemma 3-12B is Google's latest open source model, successor to Gemma 2","status":"active","model_type":"chat","context_window":131072,"open_weight":true,"license":"gemma","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"vision":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":0.05,"output":0.15},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"bfloat16","tagline":"Gemma 3 introduces multimodality, supporting vision-language input and text outputs."},{"id":"google/gemma-3-27b-it","name":"gemma-3-27b-it","created_by":"google","source":"official","last_updated":"2026-04-26","family":"gemma-3","description":"Gemma 3 introduces multimodality, supporting vision-language input and text outputs. 
It handles context windows up to 128k tokens, understands over 140 languages, and offers improved math, reasoning, and chat capabilities, including structured outputs and function calling. Gemma 3 27B is Google's latest open source model, successor to Gemma 2","status":"active","model_type":"chat","context_window":131072,"open_weight":true,"license":"gemma","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"vision":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":0.08,"output":0.16},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"fp8","tagline":"Gemma 3 introduces multimodality, supporting vision-language input and text outputs."},{"id":"google/gemma-3-4b-it","name":"gemma-3-4b-it","created_by":"google","source":"official","last_updated":"2026-06-10","family":"gemma-3","description":"Gemma 3 introduces multimodality, supporting vision-language input and text outputs. It handles context windows up to 128k tokens, understands over 140 languages, and offers improved math, reasoning, and chat capabilities, including structured outputs and function calling. Gemma 3-12B is Google's latest open source model, successor to Gemma 2","status":"active","model_type":"chat","context_window":131072,"open_weight":true,"license":"gemma","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"vision":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":0.05,"output":0.1},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"bfloat16","tagline":"Gemma 3 introduces multimodality, supporting vision-language input and text outputs."},{"id":"google/gemma-4-26B-A4B-it","name":"gemma-4-26B-A4B-it","created_by":"google","source":"official","last_updated":"2026-04-26","family":"gemma-4","description":"Efficient, MoE variant of Gemma 4. 
Gemma is a family of open models built by Google DeepMind. Gemma 4 models are multimodal, handling text and image input and generating text output.","status":"active","model_type":"chat","context_window":262144,"reasoning_tokens":true,"open_weight":true,"license":"gemma","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"reasoning":true,"vision":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":0.07,"output":0.34},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"fp8","tagline":"Efficient, MoE variant of Gemma 4."},{"id":"google/gemma-4-31B-it-turbo","name":"gemma-4-31B-it-turbo","created_by":"google","source":"official","family":"gemma-4","description":"Gemma is a family of open models built by Google DeepMind. Gemma 4 models are multimodal, handling text and image input and generating text output.","status":"active","context_window":262144,"model_type":"chat","reasoning_tokens":true,"license":"gemma","open_weight":true,"tagline":"Gemma is a family of open models built by Google DeepMind.","capabilities":{"tool_call":true,"json_mode":true,"reasoning":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.12,"output":0.37},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"fp4","last_updated":"2026-06-03"},{"id":"google/gemma-4-31B-it","name":"gemma-4-31B-it","created_by":"google","source":"official","last_updated":"2026-04-26","family":"gemma-4","description":"Gemma is a family of open models built by Google DeepMind. 
Gemma 4 models are multimodal, handling text and image input and generating text output.","status":"active","model_type":"chat","context_window":262144,"reasoning_tokens":true,"open_weight":true,"license":"gemma","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"reasoning":true,"vision":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":0.13,"output":0.38},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"fp8","tagline":"Gemma is a family of open models built by Google DeepMind."},{"id":"google/veo-3.0-fast","name":"veo-3.0-fast","created_by":"google","source":"official","last_updated":"2026-04-26","family":"veo-3.0","description":"Veo 3 Fast is a speed-optimized version of the Veo 3 model, designed for rapid video creation. While maintaining high quality, it delivers results in a fraction of the time, making it ideal for quick iterations and dynamic content generation.","status":"active","model_type":"video","open_weight":false,"license":"gemma","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"tagline":"Veo 3 Fast is a speed-optimized version of the Veo 3 model, designed for rapid video creation."},{"id":"google/veo-3.0","name":"veo-3.0","created_by":"google","source":"official","last_updated":"2026-04-26","family":"veo-3.0","description":"Veo 3 is a state-of-the-art text-to-video model from Google that generates high-fidelity, cinematic videos with synchronized audio from a simple text prompt. 
It excels at creating realistic and imaginative scenes with a deep understanding of natural language and visual dynamics.","status":"active","model_type":"video","open_weight":false,"license":"gemma","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"tagline":"Veo 3 is a state-of-the-art text-to-video model from Google that generates high-fidelity, cinematic videos with synchronized audio from a simple text prompt."},{"id":"google/veo-3.1-fast","name":"veo-3.1-fast","created_by":"google","source":"official","last_updated":"2026-04-26","family":"veo-3.1","description":"Veo 3.1 is the latest text-to-video model from Google that generates high-fidelity, cinematic videos with synchronized audio from a simple text prompt. It excels at creating realistic and imaginative scenes with a deep understanding of natural language and visual dynamics.","status":"active","model_type":"video","open_weight":false,"license":"gemma","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"tagline":"Veo 3.1 is the latest text-to-video model from Google that generates high-fidelity, cinematic videos with synchronized audio from a simple text prompt."},{"id":"google/veo-3.1","name":"veo-3.1","created_by":"google","source":"official","last_updated":"2026-04-26","family":"veo-3.1","description":"Veo 3.1 is the latest text-to-video model from Google that generates high-fidelity, cinematic videos with synchronized audio from a simple text prompt. 
It excels at creating realistic and imaginative scenes with a deep understanding of natural language and visual dynamics.","status":"active","model_type":"video","open_weight":false,"license":"gemma","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"tagline":"Veo 3.1 is the latest text-to-video model from Google that generates high-fidelity, cinematic videos with synchronized audio from a simple text prompt."},{"id":"Gryphe/MythoMax-L2-13b","name":"MythoMax-L2-13b","created_by":"gryphe","source":"official","last_updated":"2026-04-26","family":"gryphe","status":"active","model_type":"chat","context_window":4096,"open_weight":true,"capabilities":{"structured_output":true,"json_mode":true,"streaming":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.4,"output":0.4},"endpoints":["chat_completions"],"quantization":"fp16"},{"id":"hexgrad/Kokoro-82M","name":"Kokoro-82M","created_by":"hexgrad","source":"official","last_updated":"2026-04-26","family":"hexgrad","description":"Kokoro is an open-weight TTS model with 82 million parameters. Despite its lightweight architecture, it delivers comparable quality to larger models while being significantly faster and more cost-efficient. With Apache-licensed weights, Kokoro can be deployed anywhere from production environments to personal projects.","status":"active","model_type":"tts","open_weight":true,"capabilities":{"streaming":true},"modalities":{"input":["text"],"output":["audio"]},"endpoints":["audio_speech"],"pricing_notes":["$0.6200 per 1M input characters"],"tagline":"Kokoro is an open-weight TTS model with 82 million parameters."},{"id":"intfloat/e5-base-v2","name":"e5-base-v2","created_by":"intfloat","source":"official","last_updated":"2026-04-26","family":"e5","description":"Text Embeddings by Weakly-Supervised Contrastive Pre-training. 
Model has 24 layers and 1024 out dim.","status":"active","model_type":"embed","open_weight":true,"license":"mit","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["embeddings"],"tagline":"Text Embeddings by Weakly-Supervised Contrastive Pre-training."},{"id":"intfloat/e5-large-v2","name":"e5-large-v2","created_by":"intfloat","source":"official","last_updated":"2026-04-26","family":"e5","description":"Text Embeddings by Weakly-Supervised Contrastive Pre-training. Model has 24 layers and 1024 out dim.","status":"active","model_type":"embed","open_weight":true,"license":"mit","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["embeddings"],"tagline":"Text Embeddings by Weakly-Supervised Contrastive Pre-training."},{"id":"intfloat/multilingual-e5-large-instruct","name":"multilingual-e5-large-instruct","created_by":"intfloat","source":"official","last_updated":"2026-04-26","family":"e5","description":"The Multilingual-E5 models, initialized from XLM-RoBERTa, support up to 512 tokens per input — any longer text will be silently truncated. 
To ensure optimal performance, always prefix inputs with “query:” or “passage:”, as the model was explicitly trained with this format.","status":"active","model_type":"embed","open_weight":true,"license":"mit","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["embeddings"],"tagline":"The Multilingual-E5 models, initialized from XLM-RoBERTa, support up to 512 tokens per input — any longer text will be silently truncated."},{"id":"intfloat/multilingual-e5-large","name":"multilingual-e5-large","created_by":"intfloat","source":"official","last_updated":"2026-04-26","family":"e5","description":"The Multilingual-E5-large model is a 24-layer text embedding model with an embedding size of 1024, trained on a mixture of multilingual datasets and supporting 100 languages.","status":"active","model_type":"embed","open_weight":true,"license":"mit","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["embeddings"],"quantization":"fp32","tagline":"The Multilingual-E5-large model is a 24-layer text embedding model with an embedding size of 1024, trained on a mixture of multilingual datasets and supporting 100 languages."},{"id":"inworld-ai/inworld-tts-1.5-max","name":"inworld-tts-1.5-max","created_by":"inworld-ai","source":"official","last_updated":"2026-04-26","family":"inworld-ai","description":"High-quality multilingual text-to-speech model by Inworld AI with 130+ preset voices across 15 languages. Supports voice cloning, word-level timestamps, and streaming. 
Optimized for natural, expressive speech with <250ms time-to-first-audio.","status":"active","model_type":"tts","open_weight":false,"capabilities":{"streaming":true},"modalities":{"input":["text"],"output":["audio"]},"endpoints":["audio_speech"],"pricing_notes":["$50.0000 per 1M input characters"],"tagline":"High-quality multilingual text-to-speech model by Inworld AI with 130+ preset voices across 15 languages."},{"id":"inworld-ai/inworld-tts-1.5-mini","name":"inworld-tts-1.5-mini","created_by":"inworld-ai","source":"official","last_updated":"2026-04-26","family":"inworld-ai","description":"Fast multilingual text-to-speech model by Inworld AI with 130+ preset voices across 15 languages. Supports voice cloning, word-level timestamps, and streaming. Optimized for low-latency applications with <130ms time-to-first-audio.","status":"active","model_type":"tts","open_weight":false,"capabilities":{"streaming":true},"modalities":{"input":["text"],"output":["audio"]},"endpoints":["audio_speech"],"pricing_notes":["$25.0000 per 1M input characters"],"tagline":"Fast multilingual text-to-speech model by Inworld AI with 130+ preset voices across 15 languages."},{"id":"inworld-ai/realtime-tts-1.5-max","name":"realtime-tts-1.5-max","created_by":"inworld-ai","source":"official","description":"High-quality multilingual text-to-speech model by Inworld AI with 130+ preset voices across 15 languages. Supports voice cloning, word-level timestamps, and streaming. 
Optimized for natural, expressive speech with <250ms time-to-first-audio.","status":"active","model_type":"tts","open_weight":false,"tagline":"High-quality multilingual text-to-speech model by Inworld AI with 130+ preset voices across 15 languages.","capabilities":{"streaming":true},"modalities":{"input":["text"],"output":["audio"]},"endpoints":["audio_speech"],"pricing_notes":["$50.0000 per 1M input characters"],"last_updated":"2026-06-03"},{"id":"inworld-ai/realtime-tts-1.5-mini","name":"realtime-tts-1.5-mini","created_by":"inworld-ai","source":"official","description":"Fast multilingual text-to-speech model by Inworld AI with 130+ preset voices across 15 languages. Supports voice cloning, word-level timestamps, and streaming. Optimized for low-latency applications with <130ms time-to-first-audio.","status":"active","model_type":"tts","open_weight":false,"tagline":"Fast multilingual text-to-speech model by Inworld AI with 130+ preset voices across 15 languages.","capabilities":{"streaming":true},"modalities":{"input":["text"],"output":["audio"]},"endpoints":["audio_speech"],"pricing_notes":["$25.0000 per 1M input characters"],"last_updated":"2026-06-03"},{"id":"inworld-ai/realtime-tts-2","name":"realtime-tts-2","created_by":"inworld-ai","source":"official","description":"Realtime TTS 2.0 is a low-latency text-to-speech model with natural language steering, allowing you to control tone and emotion directly in the prompt (e.g., “[be happy and upbeat] Hello!”). It supports cross-lingual voices and multiple languages, enabling the same voice to speak consistently across different languages. 
This is an early access preview ahead of full launch, with ongoing improvements to voice quality and steering.","status":"active","model_type":"tts","open_weight":false,"tagline":"Realtime TTS 2.0 is a low-latency text-to-speech model with natural language steering, allowing you to control tone and emotion directly in the prompt (e.g., “[be happy and upbeat] Hello!”).","capabilities":{"streaming":true},"modalities":{"input":["text"],"output":["audio"]},"endpoints":["audio_speech"],"pricing_notes":["$35.0000 per 1M input characters"],"last_updated":"2026-06-03"},{"id":"meta-llama/Llama-3.2-11B-Vision-Instruct","name":"Llama-3.2-11B-Vision-Instruct","created_by":"meta","source":"official","last_updated":"2026-06-10","family":"Llama-3.2","description":"Llama 3.2 11B Vision is a multimodal model with 11 billion parameters, designed to handle tasks combining visual and textual data. It excels in tasks such as image captioning and visual question answering, bridging the gap between language generation and visual reasoning. Pre-trained on a massive dataset of image-text pairs, it performs well in complex, high-accuracy image analysis. 
Its ability to integrate visual understanding with language processing makes it an ideal solution for industrie...","status":"active","model_type":"chat","context_window":131072,"open_weight":true,"capabilities":{"structured_output":true,"json_mode":true,"vision":true,"streaming":true,"fine_tuning":true,"tool_call":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":0.345,"output":0.345},"endpoints":["chat_completions"],"quantization":"fp8","license":"llama","tagline":"Llama 3.2 11B Vision is a multimodal model with 11 billion parameters, designed to handle tasks combining visual and textual data.","max_output_tokens":131072,"knowledge_cutoff":"2023-12","parameters":11},{"id":"meta-llama/Llama-3.3-70B-Instruct-Turbo","name":"Llama-3.3-70B-Instruct-Turbo","created_by":"meta","source":"official","last_updated":"2026-04-26","family":"Llama-3.3","description":"Llama 3.3-70B Turbo is a highly optimized version of the Llama 3.3-70B model, utilizing FP8 quantization to deliver significantly faster inference speeds with a minor trade-off in accuracy. The model is designed to be helpful, safe, and flexible, with a focus on responsible deployment and mitigating potential risks such as bias, toxicity, and misinformation. 
It achieves state-of-the-art performance on various benchmarks, including conversational tasks, language translation, and text generation.","status":"active","model_type":"chat","context_window":131072,"open_weight":true,"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.1,"output":0.32},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"fp8","license":"llama","tagline":"Llama 3.3-70B Turbo is a highly optimized version of the Llama 3.3-70B model, utilizing FP8 quantization to deliver significantly faster inference speeds with a minor trade-off in accuracy."},{"id":"meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8","name":"Llama-4-Maverick-17B-128E-Instruct-FP8","created_by":"meta","source":"official","last_updated":"2026-04-26","family":"Llama-4","description":"The Llama 4 collection of models are natively multimodal AI models that enable text and multimodal experiences. These models leverage a mixture-of-experts architecture to offer industry-leading performance in text and image understanding. 
Llama 4 Maverick, a 17 billion parameter model with 128 experts","status":"active","model_type":"chat","context_window":1048576,"open_weight":true,"capabilities":{"structured_output":true,"json_mode":true,"vision":true,"streaming":true,"fine_tuning":true,"tool_call":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":0.15,"output":0.6},"endpoints":["chat_completions"],"quantization":"fp8","license":"llama","tagline":"The Llama 4 collection of models are natively multimodal AI models that enable text and multimodal experiences.","max_output_tokens":16384,"parameters":402},{"id":"meta-llama/Llama-4-Scout-17B-16E-Instruct","name":"Llama-4-Scout-17B-16E-Instruct","created_by":"meta","source":"official","last_updated":"2026-06-10","family":"Llama-4","description":"The Llama 4 collection of models are natively multimodal AI models that enable text and multimodal experiences. These models leverage a mixture-of-experts architecture to offer industry-leading performance in text and image understanding. Llama 4 Scout, a 17 billion parameter model with 16 experts","status":"active","model_type":"chat","context_window":327680,"open_weight":true,"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"vision":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":0.1,"output":0.3},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"fp8","license":"llama","tagline":"The Llama 4 collection of models are natively multimodal AI models that enable text and multimodal experiences.","max_output_tokens":16384,"parameters":109},{"id":"meta-llama/Llama-Guard-4-12B","name":"Llama-Guard-4-12B","created_by":"meta","source":"official","last_updated":"2026-04-26","family":"llama-guard","description":"Llama Guard 4 is a natively multimodal safety classifier with 12 billion parameters trained jointly on text and multiple images. 
Llama Guard 4 is a dense architecture pruned from the Llama 4 Scout pre-trained model and fine-tuned for content safety classification. Similar to previous versions, it can be used to classify content in both LLM inputs (prompt classification) and in LLM responses (response classification). It itself acts as an LLM: it generates text in its output that indicates whe...","status":"active","model_type":"chat","context_window":163840,"open_weight":true,"capabilities":{"vision":true,"streaming":true,"fine_tuning":true,"tool_call":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":0.18,"output":0.18},"endpoints":["chat_completions"],"quantization":"bfloat16","license":"llama","tagline":"Llama Guard 4 is a natively multimodal safety classifier with 12 billion parameters trained jointly on text and multiple images.","parameters":12},{"id":"meta-llama/Meta-Llama-3-8B-Instruct","name":"Meta-Llama-3-8B-Instruct","created_by":"meta","source":"official","last_updated":"2026-04-26","family":"Llama-3","description":"Meta developed and released the Meta Llama 3 family of large language models (LLMs), a collection of pretrained and instruction tuned generative text models in 8 and 70B sizes.","status":"active","model_type":"chat","context_window":8192,"open_weight":true,"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.03,"output":0.04},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"bfloat16","license":"llama","tagline":"Meta developed and released the Meta Llama 3 family of large language models (LLMs), a collection of pretrained and instruction tuned generative text models in 8 and 70B 
sizes.","max_output_tokens":8192,"parameters":8},{"id":"meta-llama/Meta-Llama-3.1-70B-Instruct-Turbo","name":"Meta-Llama-3.1-70B-Instruct-Turbo","created_by":"meta","source":"official","last_updated":"2026-04-26","family":"Llama-3.1","description":"Meta developed and released the Meta Llama 3.1 family of large language models (LLMs), a collection of pretrained and instruction tuned generative text models in 8B, 70B and 405B sizes","status":"active","model_type":"chat","context_window":131072,"open_weight":true,"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.4,"output":0.4},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"fp8","license":"llama","tagline":"Meta developed and released the Meta Llama 3.1 family of large language models (LLMs), a collection of pretrained and instruction tuned generative text models in 8B, 70B and 405B sizes"},{"id":"meta-llama/Meta-Llama-3.1-70B-Instruct","name":"Meta-Llama-3.1-70B-Instruct","created_by":"meta","source":"official","last_updated":"2026-04-26","family":"Llama-3.1","description":"Meta developed and released the Meta Llama 3.1 family of large language models (LLMs), a collection of pretrained and instruction tuned generative text models in 8B, 70B and 405B sizes","status":"active","model_type":"chat","context_window":131072,"open_weight":true,"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.4,"output":0.4},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"bfloat16","license":"llama","tagline":"Meta developed and released the Meta Llama 3.1 family of large language models (LLMs), a collection of pretrained and instruction tuned generative text models in 8B, 70B and 405B 
sizes"},{"id":"meta-llama/Meta-Llama-3.1-8B-Instruct-Turbo","name":"Meta-Llama-3.1-8B-Instruct-Turbo","created_by":"meta","source":"official","last_updated":"2026-04-26","family":"Llama-3.1","description":"Meta developed and released the Meta Llama 3.1 family of large language models (LLMs), a collection of pretrained and instruction tuned generative text models in 8B, 70B and 405B sizes","status":"active","model_type":"chat","context_window":131072,"open_weight":true,"capabilities":{"tool_call":true,"json_mode":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.02,"output":0.03},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"fp8","license":"llama","tagline":"Meta developed and released the Meta Llama 3.1 family of large language models (LLMs), a collection of pretrained and instruction tuned generative text models in 8B, 70B and 405B sizes"},{"id":"meta-llama/Meta-Llama-3.1-8B-Instruct","name":"Meta-Llama-3.1-8B-Instruct","created_by":"meta","source":"official","last_updated":"2026-04-26","family":"Llama-3.1","description":"Meta developed and released the Meta Llama 3.1 family of large language models (LLMs), a collection of pretrained and instruction tuned generative text models in 8B, 70B and 405B sizes","status":"active","model_type":"chat","context_window":131072,"open_weight":true,"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.02,"output":0.05},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"bfloat16","license":"llama","tagline":"Meta developed and released the Meta Llama 3.1 family of large language models (LLMs), a collection of pretrained and instruction tuned generative text models in 8B, 70B and 405B 
sizes"},{"id":"microsoft/phi-4","name":"phi-4","created_by":"microsoft","source":"official","last_updated":"2026-04-26","family":"phi-4","description":"Phi-4 is a model built upon a blend of synthetic datasets, data from filtered public domain websites, and acquired academic books and Q&A datasets. The goal of this approach was to ensure that small capable models were trained with data focused on high quality and advanced reasoning.","status":"active","model_type":"chat","context_window":16384,"open_weight":true,"capabilities":{"structured_output":true,"json_mode":true,"streaming":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.07,"output":0.14},"endpoints":["chat_completions"],"quantization":"bfloat16","tagline":"Phi-4 is a model built upon a blend of synthetic datasets, data from filtered public domain websites, and acquired academic books and Q&A datasets."},{"id":"MiniMaxAI/MiniMax-M2.5","name":"MiniMax-M2.5","created_by":"minimax","source":"official","last_updated":"2026-04-26","family":"minimax","description":"MiniMax M2.5 is SOTA in coding, agentic tool use and search, office work, and a range of other economically valuable tasks, boasting scores of 80.2% in SWE-Bench Verified, 51.3% in Multi-SWE-Bench, and 76.3% in BrowseComp (with context management).","status":"active","model_type":"chat","context_window":196608,"reasoning_tokens":true,"open_weight":true,"license":"minimax","capabilities":{"tool_call":true,"json_mode":true,"reasoning":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.15,"output":1.15,"cached_input":0.03},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"fp8","tagline":"MiniMax M2.5 is SOTA in coding, agentic tool use and search, office work, and a range of other economically valuable tasks, boasting scores of 80.2% in SWE-Bench Verified, 51.3% in Multi-SWE-Bench, 
an"},{"id":"MiniMaxAI/MiniMax-M2.7-Turbo","name":"MiniMax-M2.7-Turbo","created_by":"minimax","source":"official","family":"minimax","description":"Speed-optimized MiniMax-M2.7","status":"active","context_window":196608,"model_type":"chat","reasoning_tokens":true,"license":"minimax","open_weight":false,"tagline":"Speed-optimized MiniMax-M2.7","capabilities":{"tool_call":true,"json_mode":true,"reasoning":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.45,"output":2.1},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"fp8","last_updated":"2026-06-29"},{"id":"MiniMaxAI/MiniMax-M2.7","name":"MiniMax-M2.7","created_by":"minimax","source":"official","family":"minimax","description":"MiniMax-M2.7 is MiniMax's first model deeply participating in its own evolution. M2.7 is capable of building complex agent harnesses and completing highly elaborate productivity tasks, leveraging Agent Teams, complex Skills, and dynamic tool search.","status":"active","context_window":196608,"model_type":"chat","reasoning_tokens":true,"license":"minimax","open_weight":true,"tagline":"MiniMax-M2.7 is MiniMax's first model deeply participating in its own evolution.","capabilities":{"tool_call":true,"json_mode":true,"reasoning":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.25,"output":1,"cached_input":0.05},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"fp8","last_updated":"2026-06-18"},{"id":"mistralai/Mistral-Nemo-Instruct-2407","name":"Mistral-Nemo-Instruct-2407","created_by":"mistral","source":"official","last_updated":"2026-04-26","family":"mistral","description":"12B model trained jointly by Mistral AI and NVIDIA, it significantly outperforms existing models smaller or similar in 
size.","status":"active","model_type":"chat","context_window":131072,"open_weight":true,"license":"apache-2.0","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.02,"output":0.04},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"fp8","tagline":"12B model trained jointly by Mistral AI and NVIDIA, it significantly outperforms existing models smaller or similar in size."},{"id":"mistralai/Mistral-Small-24B-Instruct-2501","name":"Mistral-Small-24B-Instruct-2501","created_by":"mistral","source":"official","last_updated":"2026-04-26","family":"mistral","description":"Mistral Small 3 is a 24B-parameter language model optimized for low-latency performance across common AI tasks. Released under the Apache 2.0 license, it features both pre-trained and instruction-tuned versions designed for efficient local deployment. The model achieves 81% accuracy on the MMLU benchmark and performs competitively with larger models like Llama 3.3 70B and Qwen 32B, while operating at three times the speed on equivalent hardware.","status":"active","model_type":"chat","context_window":32768,"open_weight":true,"license":"apache-2.0","capabilities":{"structured_output":true,"json_mode":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.05,"output":0.08},"endpoints":["chat_completions"],"quantization":"fp8","tagline":"Mistral Small 3 is a 24B-parameter language model optimized for low-latency performance across common AI tasks."},{"id":"mistralai/Mistral-Small-3.2-24B-Instruct-2506","name":"Mistral-Small-3.2-24B-Instruct-2506","created_by":"mistral","source":"official","last_updated":"2026-04-26","family":"mistral","description":"Mistral-Small-3.2-24B-Instruct is a drop-in upgrade over the 3.1 release, with markedly better instruction following, roughly half the 
infinite-generation errors, and a more robust function-calling interface—while otherwise matching or slightly improving on all previous text and vision benchmarks.","status":"active","model_type":"chat","context_window":128000,"open_weight":true,"license":"apache-2.0","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"vision":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":0.075,"output":0.2},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"fp8","tagline":"Mistral-Small-3.2-24B-Instruct is a drop-in upgrade over the 3.1 release, with markedly better instruction following, roughly half the infinite-generation errors, and a more robust function-calling in"},{"id":"mistralai/Mixtral-8x7B-Instruct-v0.1","name":"Mixtral-8x7B-Instruct-v0.1","created_by":"mistral","source":"official","last_updated":"2026-04-26","family":"mixtral","description":"Mixtral is mixture of expert large language model (LLM) from Mistral AI. This is state of the art machine learning model using a mixture 8 of experts (MoE) 7b models. During inference 2 expers are selected. This architecture allows large models to be fast and cheap at inference. 
The Mixtral-8x7B outperforms Llama 2 70B on most benchmarks.","status":"active","model_type":"chat","context_window":32768,"open_weight":true,"license":"apache-2.0","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.54,"output":0.54},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"fp8","tagline":"Mixtral is mixture of expert large language model (LLM) from Mistral AI."},{"id":"mistralai/Voxtral-Mini-3B-2507","name":"Voxtral-Mini-3B-2507","created_by":"mistral","source":"official","last_updated":"2026-04-26","family":"mistralai","description":"Voxtral Mini is an enhancement of Ministral 3B, incorporating state-of-the-art audio input capabilities while retaining best-in-class text performance. It excels at speech transcription, translation and audio understanding.","status":"active","model_type":"transcription","open_weight":true,"license":"apache-2.0","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["audio"],"output":["text"]},"endpoints":["audio_transcriptions"],"quantization":"bf16","tagline":"Voxtral Mini is an enhancement of Ministral 3B, incorporating state-of-the-art audio input capabilities while retaining best-in-class text performance."},{"id":"mistralai/Voxtral-Small-24B-2507","name":"Voxtral-Small-24B-2507","created_by":"mistral","source":"official","last_updated":"2026-04-26","family":"mistralai","description":"Voxtral Small is an enhancement of Mistral Small 3, incorporating state-of-the-art audio input capabilities while retaining best-in-class text performance. 
It excels at speech transcription, translation and audio understanding.","status":"active","model_type":"transcription","open_weight":true,"license":"apache-2.0","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["audio"],"output":["text"]},"endpoints":["audio_transcriptions"],"quantization":"bf16","tagline":"Voxtral Small is an enhancement of Mistral Small 3, incorporating state-of-the-art audio input capabilities while retaining best-in-class text performance."},{"id":"moonshotai/Kimi-K2.5","name":"Kimi-K2.5","created_by":"moonshot","source":"official","last_updated":"2026-04-26","family":"Kimi-K2.5","description":"Kimi K2.5 is an open-source, native multimodal agentic model built through continual pretraining on approximately 15 trillion mixed visual and text tokens atop Kimi-K2-Base. It seamlessly integrates vision and language understanding with advanced agentic capabilities, instant and thinking modes, as well as conversational and agentic paradigms.","status":"active","model_type":"chat","context_window":262144,"reasoning_tokens":true,"open_weight":true,"license":"modified-mit","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"reasoning":true,"vision":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":0.45,"output":2.25,"cached_input":0.07},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"fp4","tagline":"Kimi K2.5 is an open-source, native multimodal agentic model built through continual pretraining on approximately 15 trillion mixed visual and text tokens atop Kimi-K2-Base.","max_output_tokens":32768},{"id":"moonshotai/Kimi-K2.6","name":"Kimi-K2.6","created_by":"moonshot","source":"official","last_updated":"2026-06-03","family":"Kimi-K2.6","description":"Kimi K2.6 is an open-source, native multimodal agentic model that advances practical capabilities in long-horizon coding, coding-driven design, proactive 
autonomous execution, and swarm-based task orchestration.","status":"active","model_type":"chat","context_window":262144,"reasoning_tokens":true,"open_weight":true,"license":"modified-mit","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"reasoning":true,"streaming":true,"fine_tuning":true,"vision":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":0.75,"output":3.5,"cached_input":0.15},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"fp4","tagline":"Kimi K2.6 is an open-source, native multimodal agentic model that advances practical capabilities in long-horizon coding, coding-driven design, proactive autonomous execution, and swarm-based task orc"},{"id":"moonshotai/Kimi-K2.7-Code","name":"Kimi-K2.7-Code","created_by":"moonshot","source":"official","family":"Kimi-K2.7","description":"Kimi K2.7 Code is a coding-focused agentic model built upon Kimi K2.6. With substantial improvements on real-world long-horizon coding tasks, it strengthens end-to-end task completion across complex software engineering workflows while improving token efficiency, reducing thinking-token usage by approximately 30% compared with Kimi K2.6.","status":"active","context_window":262144,"model_type":"chat","reasoning_tokens":true,"license":"modified-mit","open_weight":true,"tagline":"Kimi K2.7 Code is a coding-focused agentic model built upon Kimi 
K2.6.","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"reasoning":true,"vision":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":0.74,"output":3.5,"cached_input":0.15},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"fp4","last_updated":"2026-06-18"},{"id":"NousResearch/Hermes-3-Llama-3.1-405B","name":"Hermes-3-Llama-3.1-405B","created_by":"nousresearch","source":"official","last_updated":"2026-04-26","family":"llama-3.1","description":"Hermes 3 is a cutting-edge language model that offers advanced capabilities in roleplaying, reasoning, and conversation. It's a fine-tuned version of the Llama-3.1 405B foundation model, designed to align with user needs and provide powerful control. Key features include reliable function calling, structured output, generalist assistant capabilities, and improved code generation. Hermes 3 is competitive with Llama-3.1 Instruct models, with its own strengths and weaknesses.","status":"active","model_type":"chat","context_window":131072,"open_weight":true,"capabilities":{"structured_output":true,"json_mode":true,"streaming":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":1,"output":1},"endpoints":["chat_completions"],"quantization":"fp8","tagline":"Hermes 3 is a cutting-edge language model that offers advanced capabilities in roleplaying, reasoning, and conversation."},{"id":"NousResearch/Hermes-3-Llama-3.1-70B","name":"Hermes-3-Llama-3.1-70B","created_by":"nousresearch","source":"official","last_updated":"2026-06-10","family":"llama-3.1","description":"Hermes 3 is a generalist language model with many improvements over Hermes 2, including advanced agentic capabilities, much better roleplaying, reasoning, multi-turn conversation, long context coherence, and improvements across the 
board.","status":"active","model_type":"chat","context_window":131072,"open_weight":true,"capabilities":{"structured_output":true,"json_mode":true,"streaming":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.7,"output":0.7},"endpoints":["chat_completions"],"quantization":"fp8","tagline":"Hermes 3 is a generalist language model with many improvements over Hermes 2, including advanced agentic capabilities, much better roleplaying, reasoning, multi-turn conversation, long context coheren"},{"id":"nvidia/Cosmos3-Nano","name":"Cosmos3-Nano","created_by":"nvidia","source":"official","description":"Cosmos3 is a world foundation model that unifies understanding and generation within a single Mixture-of-Transformer (MoT) architecture. Two tightly coupled towers—a Reasoner (vision-language model) and a Generator (world simulator)—share latent representations so that structured perception directly grounds realistic, temporally consistent simulation.","status":"active","model_type":"video","open_weight":true,"tagline":"Cosmos3 is a world foundation model that unifies understanding and generation within a single Mixture-of-Transformer (MoT) architecture.","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"pricing_notes":["$0.0108 / second (480p)"],"last_updated":"2026-06-03"},{"id":"nvidia/Cosmos3-Super","name":"Cosmos3-Super","created_by":"nvidia","source":"official","description":"Cosmos3 is a world foundation model that unifies understanding and generation within a single Mixture-of-Transformer (MoT) architecture. 
Two tightly coupled towers—a Reasoner (vision-language model) and a Generator (world simulator)—share latent representations so that structured perception directly grounds realistic, temporally consistent simulation.","status":"active","model_type":"video","open_weight":true,"tagline":"Cosmos3 is a world foundation model that unifies understanding and generation within a single Mixture-of-Transformer (MoT) architecture.","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"pricing_notes":["$0.0432 / second (480p)"],"last_updated":"2026-06-10"},{"id":"nvidia/Llama-3.1-Nemotron-70B-Instruct","name":"Llama-3.1-Nemotron-70B-Instruct","created_by":"nvidia","source":"official","last_updated":"2026-04-26","family":"Llama-3.1","description":"Llama-3.1-Nemotron-70B-Instruct is a large language model customized by NVIDIA to improve the helpfulness of LLM generated responses to user queries. This model reaches Arena Hard of 85.0, AlpacaEval 2 LC of 57.6 and GPT-4-Turbo MT-Bench of 8.98, which are known to be predictive of LMSys Chatbot Arena Elo. 
As of 16th Oct 2024, this model is #1 on all three automatic alignment benchmarks (verified tab for AlpacaEval 2 LC), edging out strong frontier models such as GPT-4o and Claude 3.5 Sonnet.","status":"active","model_type":"chat","context_window":131072,"open_weight":true,"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":1.2,"output":1.2},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"fp8","tagline":"Llama-3.1-Nemotron-70B-Instruct is a large language model customized by NVIDIA to improve the helpfulness of LLM generated responses to user queries."},{"id":"nvidia/Llama-3.3-Nemotron-Super-49B-v1.5","name":"Llama-3.3-Nemotron-Super-49B-v1.5","created_by":"nvidia","source":"official","last_updated":"2026-06-10","family":"Llama-3.3","description":"Llama-3.3-Nemotron-Super-49B-v1.5 is a large language model (LLM) optimized for advanced reasoning, conversational interactions, retrieval-augmented generation (RAG), and tool-calling tasks. 
Derived from Meta's Llama-3.3-70B-Instruct, it employs a Neural Architecture Search (NAS) approach, significantly enhancing efficiency and reducing memory requirements.","status":"active","model_type":"chat","context_window":131072,"reasoning_tokens":true,"open_weight":true,"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"reasoning":true,"streaming":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.4,"output":0.4},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"fp8","tagline":"Llama-3.3-Nemotron-Super-49B-v1.5 is a large language model (LLM) optimized for advanced reasoning, conversational interactions, retrieval-augmented generation (RAG), and tool-calling tasks."},{"id":"nvidia/llama-nemotron-embed-vl-1b-v2","name":"llama-nemotron-embed-vl-1b-v2","created_by":"nvidia","source":"official","last_updated":"2026-04-26","family":"llama","description":"The llama-nemotron-embed-vl-1b-v2 is a high-performance multimodal embedding model designed to transform text queries and document images into dense vector representations for advanced retrieval systems. It excels at understanding complex visual content like charts, tables, and infographics.","status":"active","model_type":"embed","open_weight":true,"capabilities":{"streaming":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["embeddings"],"tagline":"The llama-nemotron-embed-vl-1b-v2 is a high-performance multimodal embedding model designed to transform text queries and document images into dense vector representations for advanced retrieval systems."},{"id":"nvidia/llama-nemotron-rerank-vl-1b-v2","name":"llama-nemotron-rerank-vl-1b-v2","created_by":"nvidia","source":"official","last_updated":"2026-04-26","family":"llama","description":"The llama-nemotron-rerank-vl-1b-v2 is a 1.7B parameter multimodal reranking model designed to evaluate and order the relevance of document images and text against specific user queries. 
It excels at understanding complex visual content like charts, tables, and infographics.","status":"active","model_type":"rerank","open_weight":true,"modalities":{"input":["text"],"output":["text"]},"endpoints":["rerank"],"quantization":"bf16","tagline":"The llama-nemotron-rerank-vl-1b-v2 is a 1.7B parameter multimodal reranking model designed to evaluate and order the relevance of document images and text against specific user queries."},{"id":"nvidia/Nemotron-3-Nano-30B-A3B","name":"Nemotron-3-Nano-30B-A3B","created_by":"nvidia","source":"official","last_updated":"2026-04-26","family":"nemotron","description":"NVIDIA Nemotron 3 Nano is an open small reasoning model optimized for fast, cost-efficient inference in agentic and production workloads. Built with a hybrid Mixture-of-Experts (MoE) and Mamba-Transformer architecture, it delivers strong multi-step reasoning, high token throughput, stable latency with predictable cost, and efficient deployment for agent-based systems. Designed for real-world AI systems where reasoning can generate significantly more tokens per prompt, Nemotron Nano reduces co...","status":"active","model_type":"chat","context_window":262144,"reasoning_tokens":true,"open_weight":true,"capabilities":{"tool_call":true,"reasoning":true,"streaming":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.05,"output":0.2},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"fp4","tagline":"NVIDIA Nemotron 3 Nano is an open small reasoning model optimized for fast, cost-efficient inference in agentic and production workloads."},{"id":"nvidia/Nemotron-3-Nano-Omni-30B-A3B-Reasoning","name":"Nemotron-3-Nano-Omni-30B-A3B-Reasoning","created_by":"nvidia","source":"official","description":"Nemotron 3 Nano Omni is an open multimodal model built on a hybrid Mixture-of-Experts (MoE) architecture, engineered for high efficiency and strong accuracy across image, video, audio, and text inputs. 
It powers always-on sub-agents for computer use, document intelligence, and audio-video understanding—replacing fragmented vision, speech, and language pipelines with a single unified inference pass.","status":"active","context_window":262144,"model_type":"chat","reasoning_tokens":true,"open_weight":true,"tagline":"Nemotron 3 Nano Omni is an open multimodal model built on a hybrid Mixture-of-Experts (MoE) architecture, engineered for high efficiency and strong accuracy across image, video, audio, and text inputs.","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"reasoning":true,"vision":true,"streaming":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":0.2,"output":0.8},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"bfloat16","last_updated":"2026-06-03"},{"id":"nvidia/Nemotron-3.5-ASR-Streaming-Multilingual-0.6b","name":"Nemotron-3.5-ASR-Streaming-Multilingual-0.6b","created_by":"nvidia","source":"official","description":"Nemotron 3.5 ASR Streaming Multilingual is an open 0.6B-parameter prompt-conditioned cache-aware FastConformer-RNNT model, engineered for low-latency streaming transcription across 40+ languages. 
It powers real-time captioning, voice agents, and multilingual transcription pipelines—replacing separate per-language Whisper deployments with a single inference pass.","status":"active","model_type":"transcription","open_weight":true,"tagline":"Nemotron 3.5 ASR Streaming Multilingual is an open 0.6B-parameter prompt-conditioned cache-aware FastConformer-RNNT model, engineered for low-latency streaming transcription across 40+ languages.","capabilities":{"streaming":true},"modalities":{"input":["audio"],"output":["text"]},"endpoints":["audio_transcriptions"],"last_updated":"2026-06-10"},{"id":"nvidia/Nemotron-Content-Safety-3.5","name":"Nemotron-Content-Safety-3.5","created_by":"nvidia","source":"official","description":"Nemotron Content Safety 3.5 is a multimodal safety classifier developed by NVIDIA. A compact safety model that handles text, images, and custom policies. It outputs a safe/unsafe classification plus a reasoning trace, and can be used as an inference-time guardrail, as a judge for LLM safety testing and evaluation, or with the accompanying training dataset to post-train models for safer behavior.","status":"active","context_window":131072,"model_type":"chat","open_weight":true,"tagline":"Nemotron Content Safety 3.5 is a multimodal safety classifier developed by NVIDIA.","capabilities":{"vision":true,"streaming":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":0.2,"output":0.2},"endpoints":["chat_completions"],"quantization":"bfloat16","last_updated":"2026-06-10"},{"id":"nvidia/NVIDIA-Nemotron-3-Super-120B-A12B","name":"NVIDIA-Nemotron-3-Super-120B-A12B","created_by":"nvidia","source":"official","last_updated":"2026-06-29","family":"nemotron","description":"NVIDIA Nemotron 3 Super is a hybrid Mixture-of-Experts (MoE) model engineered for highest compute efficiency and accuracy in multi-agent applications and specialized agentic systems. 
It is optimized to run many collaborating agents per application on a single GPU, delivering high accuracy for reasoning, tool use, and instruction following.","status":"active","model_type":"chat","context_window":262144,"reasoning_tokens":true,"open_weight":true,"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"reasoning":true,"streaming":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.085,"output":0.4},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"bfloat16","tagline":"NVIDIA Nemotron 3 Super is a hybrid Mixture-of-Experts (MoE) model engineered for highest compute efficiency and accuracy in multi-agent applications and specialized agentic systems."},{"id":"nvidia/NVIDIA-Nemotron-3-Ultra-550B-A55B-BF16","name":"NVIDIA-Nemotron-3-Ultra-550B-A55B-BF16","created_by":"nvidia","source":"official","description":"Nemotron 3 Ultra is built for, frontier reasoning, orchestration, coding agents, deep research, and complex enterprise workflows. 
It delivers up to 5x faster inference and up to 30% lower cost for agentic workloads while supporting up to 1M token context.","status":"active","context_window":262144,"model_type":"chat","reasoning_tokens":true,"open_weight":true,"tagline":"Nemotron 3 Ultra is built for, frontier reasoning, orchestration, coding agents, deep research, and complex enterprise workflows.","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"reasoning":true,"vision":true,"streaming":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":1,"output":5,"cached_input":0.3},"tools":["function_calling"],"endpoints":["chat_completions"],"last_updated":"2026-06-18"},{"id":"nvidia/NVIDIA-Nemotron-3-Ultra-550B-A55B","name":"NVIDIA-Nemotron-3-Ultra-550B-A55B","created_by":"nvidia","source":"official","description":"Nemotron 3 Ultra is built for, frontier reasoning, orchestration, coding agents, deep research, and complex enterprise workflows. It delivers up to 5x faster inference and up to 30% lower cost for agentic workloads while supporting up to 1M token context.","status":"active","context_window":262144,"model_type":"chat","reasoning_tokens":true,"open_weight":true,"tagline":"Nemotron 3 Ultra is built for, frontier reasoning, orchestration, coding agents, deep research, and complex enterprise workflows.","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"reasoning":true,"vision":true,"streaming":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":0.5,"output":2.2,"cached_input":0.1},"tools":["function_calling"],"endpoints":["chat_completions"],"last_updated":"2026-06-18"},{"id":"nvidia/NVIDIA-Nemotron-Nano-12B-v2-VL","name":"NVIDIA-Nemotron-Nano-12B-v2-VL","created_by":"nvidia","source":"official","last_updated":"2026-04-26","family":"nemotron","description":"NVIDIA Nemotron 2 Nano VL extends the Nemotron family into multi-modal reasoning and document intelligence. 
This auto-regressive vision-language model enables multi-image reasoning, video understanding, visual Q&A and document analysis and summarization. Optimized for enterprise AI workflows, it powers multimodal agentic systems such as visual copilots, document assistants, and knowledge automation pipelines.","status":"active","model_type":"chat","context_window":131072,"reasoning_tokens":true,"open_weight":true,"capabilities":{"reasoning":true,"vision":true,"streaming":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":0.2,"output":0.6},"endpoints":["chat_completions"],"quantization":"fp8","tagline":"NVIDIA Nemotron 2 Nano VL extends the Nemotron family into multi-modal reasoning and document intelligence."},{"id":"nvidia/NVIDIA-Nemotron-Nano-9B-v2","name":"NVIDIA-Nemotron-Nano-9B-v2","created_by":"nvidia","source":"official","last_updated":"2026-04-26","family":"nemotron","description":"NVIDIA-Nemotron-Nano-9B-v2 is a large language model (LLM) trained from scratch by NVIDIA, and designed as a unified model for both reasoning and non-reasoning tasks. It responds to user queries and tasks by first generating a reasoning trace and then concluding with a final response. The model's reasoning capabilities can be controlled via a system prompt. 
If the user prefers the model to provide its final answer without intermediate reasoning traces, it can be configured to do so.","status":"active","model_type":"chat","context_window":131072,"reasoning_tokens":true,"open_weight":true,"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"reasoning":true,"streaming":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.04,"output":0.16},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"bfloat16","tagline":"NVIDIA-Nemotron-Nano-9B-v2 is a large language model (LLM) trained from scratch by NVIDIA, and designed as a unified model for both reasoning and non-reasoning tasks."},{"id":"openai/clip-vit-base-patch32","name":"clip-vit-base-patch32","created_by":"openai","source":"official","last_updated":"2026-04-26","family":"openai","description":"The CLIP model was developed by OpenAI to investigate the robustness of computer vision models. It uses a Vision Transformer architecture and was trained on a large dataset of image-caption pairs. The model shows promise in various computer vision tasks but also has limitations, including difficulties with fine-grained classification and potential biases in certain applications.","status":"active","model_type":"image","open_weight":true,"license":"proprietary","capabilities":{"streaming":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"pricing_notes":["$0.000500 per second"],"tagline":"The CLIP model was developed by OpenAI to investigate the robustness of computer vision models."},{"id":"openai/clip-vit-large-patch14-336","name":"clip-vit-large-patch14-336","created_by":"openai","source":"official","last_updated":"2026-04-26","family":"openai","description":"A zero-shot-image-classification model released by OpenAI. The clip-vit-large-patch14-336 model was trained from scratch on an unknown dataset and achieves unspecified results on the evaluation set. 
The model's intended uses and limitations, as well as its training and evaluation data, are not provided. The training procedure used an unknown optimizer and precision, and the framework versions included Transformers 4.21.3, TensorFlow 2.8.2, and Tokenizers 0.12.1.","status":"active","model_type":"image","open_weight":true,"license":"proprietary","capabilities":{"streaming":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"pricing_notes":["$0.000500 per second"],"tagline":"A zero-shot-image-classification model released by OpenAI."},{"id":"openai/gpt-oss-120b-Turbo","name":"gpt-oss-120b-Turbo","created_by":"openai","source":"official","last_updated":"2026-04-26","family":"gpt-oss","status":"active","model_type":"chat","context_window":131072,"reasoning_tokens":true,"open_weight":true,"license":"proprietary","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"reasoning":true,"streaming":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.15,"output":0.6},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"bfloat16"},{"id":"openai/gpt-oss-120b","name":"gpt-oss-120b","created_by":"openai","source":"official","last_updated":"2026-04-26","family":"gpt-oss","description":"gpt-oss-120b is an open-weight, 117B-parameter Mixture-of-Experts (MoE) language model from OpenAI designed for high-reasoning, agentic, and general-purpose production use cases. 
The model supports configurable reasoning depth, full chain-of-thought access, and native tool use, including function calling, browsing, and structured output generation.","status":"active","model_type":"chat","context_window":131072,"reasoning_tokens":true,"open_weight":true,"license":"proprietary","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"reasoning":true,"streaming":true,"fine_tuning":false,"vision":false,"batch":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.039,"output":0.19},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"bfloat16","tagline":"gpt-oss-120b is an open-weight, 117B-parameter Mixture-of-Experts (MoE) language model from OpenAI designed for high-reasoning, agentic, and general-purpose production use cases.","max_output_tokens":131072,"knowledge_cutoff":"2024-06","parameters":120},{"id":"openai/gpt-oss-20b","name":"gpt-oss-20b","created_by":"openai","source":"official","last_updated":"2026-04-26","family":"gpt-oss","description":"gpt-oss-20b is an open-weight 21B parameter model released by OpenAI under the Apache 2.0 license. It uses a Mixture-of-Experts (MoE) architecture with 3.6B active parameters per forward pass, optimized for lower-latency inference. 
The model is trained in OpenAI’s Harmony response format and supports reasoning level configuration, fine-tuning, and agentic capabilities including function calling, tool use, and structured outputs.","status":"active","model_type":"chat","context_window":131072,"reasoning_tokens":true,"open_weight":true,"license":"proprietary","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"reasoning":true,"streaming":true,"fine_tuning":false,"vision":false,"batch":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.03,"output":0.14},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"bfloat16","tagline":"gpt-oss-20b is an open-weight 21B parameter model released by OpenAI under the Apache 2.0 license.","max_output_tokens":131072,"knowledge_cutoff":"2024-06","parameters":20},{"id":"openai/whisper-large-v3-turbo","name":"whisper-large-v3-turbo","created_by":"openai","source":"official","last_updated":"2026-04-26","family":"whisper","description":"Whisper is a state-of-the-art model for automatic speech recognition (ASR) and speech translation, proposed in the paper \"Robust Speech Recognition via Large-Scale Weak Supervision\" by Alec Radford et al. from OpenAI. Trained on >5M hours of labeled data, Whisper demonstrates a strong ability to generalise to many datasets and domains in a zero-shot setting. Whisper large-v3-turbo is a finetuned version of a pruned Whisper large-v3. 
In other words, it's the exact same model, except that the n...","status":"active","model_type":"transcription","open_weight":true,"license":"proprietary","capabilities":{"streaming":true},"modalities":{"input":["audio"],"output":["text"]},"endpoints":["audio_transcriptions"],"tagline":"Whisper is a state-of-the-art model for automatic speech recognition (ASR) and speech translation, proposed in the paper \"Robust Speech Recognition via Large-Scale Weak Supervision\" by Alec Radford et al."},{"id":"openai/whisper-large-v3","name":"whisper-large-v3","created_by":"openai","source":"official","last_updated":"2026-04-26","family":"whisper","description":"Whisper is a general-purpose speech recognition model. It is trained on a large dataset of diverse audio and is also a multi-task model that can perform multilingual speech recognition as well as speech translation and language identification.","status":"active","model_type":"transcription","open_weight":true,"license":"proprietary","capabilities":{"streaming":true},"modalities":{"input":["audio"],"output":["text"]},"endpoints":["audio_transcriptions"],"tagline":"Whisper is a general-purpose speech recognition model."},{"id":"PaddlePaddle/PaddleOCR-VL-0.9B","name":"PaddleOCR-VL-0.9B","created_by":"paddlepaddle","source":"official","last_updated":"2026-04-26","family":"paddlepaddle","description":"PaddleOCR-VL is a SOTA and resource-efficient model tailored for document parsing. Its core component is PaddleOCR-VL-0.9B, a compact yet powerful vision-language model (VLM) that integrates a NaViT-style dynamic resolution visual encoder with the ERNIE-4.5-0.3B language model to enable accurate element recognition. 
This innovative model efficiently supports 109 languages and excels in recognizing complex elements (e.g., text, tables, formulas, and charts), while maintaining minimal resource ...","status":"active","model_type":"chat","context_window":16384,"open_weight":true,"capabilities":{"structured_output":true,"json_mode":true,"vision":true,"streaming":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":0.14,"output":0.8},"endpoints":["chat_completions"],"quantization":"bfloat16","tagline":"PaddleOCR-VL is a SOTA and resource-efficient model tailored for document parsing."},{"id":"Pixverse/Pixverse-6-I2V","name":"Pixverse-6-I2V","created_by":"pixverse","source":"official","description":"PixVerse V6 redefines AI video by shifting from isolated generation to a unified, model-driven workflow. Key upgrades include 15-second durations at 1080p resolution and a multi-shot engine. This transition allows creators to move beyond short clips toward meaningful narrative production and professional-grade marketing assets suitable for 2026 digital distribution standards.","status":"active","model_type":"video","open_weight":false,"tagline":"PixVerse V6 redefines AI video by shifting from isolated generation to a unified, model-driven workflow.","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"pricing_notes":["$0.045 / second"],"last_updated":"2026-06-03"},{"id":"Pixverse/Pixverse-6-T2V","name":"Pixverse-6-T2V","created_by":"pixverse","source":"official","description":"PixVerse V6 redefines AI video by shifting from isolated generation to a unified, model-driven workflow. Key upgrades include 15-second durations at 1080p resolution and a multi-shot engine. 
This transition allows creators to move beyond short clips toward meaningful narrative production and professional-grade marketing assets suitable for 2026 digital distribution standards.","status":"active","model_type":"video","open_weight":false,"tagline":"PixVerse V6 redefines AI video by shifting from isolated generation to a unified, model-driven workflow.","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"pricing_notes":["$0.045 / second"],"last_updated":"2026-06-03"},{"id":"Pixverse/Pixverse-T2V-HD","name":"Pixverse-T2V-HD","created_by":"pixverse","source":"official","last_updated":"2026-04-26","family":"pixverse","description":"The 1080p high-fidelity mode in PixVerse renders videos with significantly enhanced sharpness and visual clarity, capturing intricate details and providing a crisp, professional-grade quality suitable for more polished projects.","status":"active","model_type":"video","open_weight":false,"modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"pricing_notes":["$0.4000 per image unit (0x0 default)"],"tagline":"The 1080p high-fidelity mode in PixVerse renders videos with significantly enhanced sharpness and visual clarity, capturing intricate details and providing a crisp, professional-grade quality suitable"},{"id":"Pixverse/Pixverse-T2V","name":"Pixverse-T2V","created_by":"pixverse","source":"official","last_updated":"2026-04-26","family":"pixverse","description":"PixVerse's 720p resolution offers a fast and reliable option for generating standard HD videos, ideal for quick previews and social media content where generation speed is prioritized over maximum detail.","status":"active","model_type":"video","open_weight":false,"modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"pricing_notes":["$0.2000 per image unit (0x0 default)"],"tagline":"PixVerse's 720p resolution offers a fast and reliable option for generating standard HD videos, ideal for quick previews and social 
media content where generation speed is prioritized over maximum det"},{"id":"PrunaAI/p-image-Edit","name":"p-image-Edit","created_by":"prunaai","source":"official","last_updated":"2026-04-26","family":"prunaai","description":"P-Image-Edit is a high-precision image editing model that applies complex transformations, insertions, removals, and style adjustments in under a second. It delivers state-of-the-art accuracy, clean boundaries, and reliable prompt alignment, making multi-step edits fast, consistent, and production-ready.","status":"active","model_type":"image","open_weight":false,"capabilities":{"streaming":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"pricing_notes":["$0.0100 per image unit (0x0 default)"],"tagline":"P-Image-Edit is a high-precision image editing model that applies complex transformations, insertions, removals, and style adjustments in under a second."},{"id":"PrunaAI/p-image","name":"p-image","created_by":"prunaai","source":"official","last_updated":"2026-04-26","family":"prunaai","description":"P-Image is a state-of-the-art real-time generation model with exceptional text rendering, fine-detail accuracy, and rock-solid prompt adherence. It’s built for instant creativity at high-fidelity images in about one second at a fraction of typical model costs.","status":"active","model_type":"image","open_weight":false,"capabilities":{"streaming":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"pricing_notes":["$0.0050 per image unit (0x0 default)"],"tagline":"P-Image is a state-of-the-art real-time generation model with exceptional text rendering, fine-detail accuracy, and rock-solid prompt adherence."},{"id":"PrunaAI/p-video-avatar","name":"p-video-avatar","created_by":"prunaai","source":"official","description":"Pruna's talking head video generation model. 
Provide a portrait image and either a speech script or an audio file, and the model generates a realistic video of the person speaking. Supports multiple voices, languages, and output resolutions.","status":"active","model_type":"video","open_weight":false,"tagline":"Pruna's talking head video generation model.","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"pricing_notes":["$0.025 / second"],"last_updated":"2026-06-03"},{"id":"PrunaAI/p-video","name":"p-video","created_by":"prunaai","source":"official","last_updated":"2026-04-26","family":"prunaai","description":"Real-time AI video generation from text, images, and audio. Supports up to 1080p at 48 FPS with built-in audio generation, draft mode for 4x faster previews, and prompt upsampling.","status":"active","model_type":"video","open_weight":false,"modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"pricing_notes":["$0.02 / second"],"tagline":"Real-time AI video generation from text, images, and audio."},{"id":"Qwen/Qwen-Image-Edit-Max","name":"Qwen-Image-Edit-Max","created_by":"alibaba","source":"official","last_updated":"2026-04-26","family":"qwen","description":"Enhanced industrial design and geometric reasoning, improved character consistency, reduced offset issues, and integrated LoRA capabilities","status":"active","model_type":"image","open_weight":false,"license":"apache-2.0","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"pricing_notes":["$0.0750 per image unit (0x0 default)"],"tagline":"Enhanced industrial design and geometric reasoning, improved character consistency, reduced offset issues, and integrated LoRA capabilities"},{"id":"Qwen/Qwen-Image-Edit","name":"Qwen-Image-Edit","created_by":"alibaba","source":"official","last_updated":"2026-04-26","family":"qwen","description":"Qwen-Image-Edit is a next-generation image editing model built on top of Qwen-Image, designed for 
both semantic and appearance-level edits. It excels at tasks like precise text modifications, style transfers, viewpoint transformations, and element adjustments while preserving overall visual consistency.","status":"active","model_type":"image","open_weight":true,"license":"apache-2.0","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"pricing_notes":["$0.0250 per image unit (1024x1024 default)"],"tagline":"Qwen-Image-Edit is a next-generation image editing model built on top of Qwen-Image, designed for both semantic and appearance-level edits."},{"id":"Qwen/Qwen-Image-Max","name":"Qwen-Image-Max","created_by":"alibaba","source":"official","last_updated":"2026-04-26","family":"qwen","description":"Compared with the Plus series, it significantly reduces the “AI-like” feel in generated images, enhancing their realism. It delivers more lifelike material textures for human subjects, finer and more detailed natural textures, and more visually appealing text rendering.","status":"active","model_type":"image","open_weight":false,"license":"apache-2.0","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"pricing_notes":["$0.0750 per image unit (0x0 default)"],"tagline":"Compared with the Plus series, it significantly reduces the “AI-like” feel in generated images, enhancing their realism."},{"id":"Qwen/Qwen2.5-72B-Instruct","name":"Qwen2.5-72B-Instruct","created_by":"alibaba","source":"official","last_updated":"2026-04-26","family":"qwen2.5","description":"Qwen2.5 is a model pretrained on a large-scale dataset of up to 18 trillion tokens, offering significant improvements in knowledge, coding, mathematics, and instruction following compared to its predecessor Qwen2. 
The model also features enhanced capabilities in generating long texts, understanding structured data, and generating structured outputs, while supporting multilingual capabilities for over 29 languages.","status":"active","model_type":"chat","context_window":32768,"open_weight":true,"license":"apache-2.0","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.36,"output":0.4},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"fp8","tagline":"Qwen2.5 is a model pretrained on a large-scale dataset of up to 18 trillion tokens, offering significant improvements in knowledge, coding, mathematics, and instruction following compared to its predecessor Qwen2."},{"id":"Qwen/Qwen3-14B","name":"Qwen3-14B","created_by":"alibaba","source":"official","last_updated":"2026-04-26","family":"qwen3","description":"Qwen3 is the latest generation of large language models in Qwen series, offering a comprehensive suite of dense and mixture-of-experts (MoE) models. 
Built upon extensive training, Qwen3 delivers groundbreaking advancements in reasoning, instruction-following, agent capabilities, and multilingual support.","status":"active","model_type":"chat","context_window":40960,"open_weight":true,"license":"apache-2.0","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.12,"output":0.24},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"fp8","tagline":"Qwen3 is the latest generation of large language models in Qwen series, offering a comprehensive suite of dense and mixture-of-experts (MoE) models."},{"id":"Qwen/Qwen3-235B-A22B-Instruct-2507","name":"Qwen3-235B-A22B-Instruct-2507","created_by":"alibaba","source":"official","last_updated":"2026-06-10","family":"qwen3","description":"Qwen3-235B-A22B-Instruct-2507 is the updated version of the Qwen3-235B-A22B non-thinking mode, featuring Significant improvements in general capabilities, including instruction following, logical reasoning, text comprehension, mathematics, science, coding and tool usage.","status":"active","model_type":"chat","context_window":262144,"open_weight":true,"license":"apache-2.0","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.09,"output":0.1},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"fp8","tagline":"Qwen3-235B-A22B-Instruct-2507 is the updated version of the Qwen3-235B-A22B non-thinking mode, featuring Significant improvements in general capabilities, including instruction following, logical reas"},{"id":"Qwen/Qwen3-235B-A22B-Thinking-2507","name":"Qwen3-235B-A22B-Thinking-2507","created_by":"alibaba","source":"official","last_updated":"2026-04-26","family":"qwen3","description":"Qwen3-235B-A22B-Thinking-2507 is the Qwen3's new 
model with scaling the thinking capability of Qwen3-235B-A22B, improving both the quality and depth of reasoning.","status":"active","model_type":"chat","context_window":262144,"reasoning_tokens":true,"open_weight":true,"license":"apache-2.0","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"reasoning":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.23,"output":2.3,"cached_input":0.2},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"fp8","tagline":"Qwen3-235B-A22B-Thinking-2507 is the Qwen3's new model with scaling the thinking capability of Qwen3-235B-A22B, improving both the quality and depth of reasoning."},{"id":"Qwen/Qwen3-30B-A3B","name":"Qwen3-30B-A3B","created_by":"alibaba","source":"official","last_updated":"2026-06-10","family":"qwen3","description":"Qwen3 is the latest generation of large language models in Qwen series, offering a comprehensive suite of dense and mixture-of-experts (MoE) models. 
Built upon extensive training, Qwen3 delivers groundbreaking advancements in reasoning, instruction-following, agent capabilities, and multilingual support","status":"active","model_type":"chat","context_window":40960,"open_weight":true,"license":"apache-2.0","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.12,"output":0.5},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"fp8","tagline":"Qwen3 is the latest generation of large language models in Qwen series, offering a comprehensive suite of dense and mixture-of-experts (MoE) models."},{"id":"Qwen/Qwen3-32B","name":"Qwen3-32B","created_by":"alibaba","source":"official","last_updated":"2026-04-26","family":"qwen3","description":"Qwen3 is the latest generation of large language models in Qwen series, offering a comprehensive suite of dense and mixture-of-experts (MoE) models. Built upon extensive training, Qwen3 delivers groundbreaking advancements in reasoning, instruction-following, agent capabilities, and multilingual support","status":"active","model_type":"chat","context_window":40960,"open_weight":true,"license":"apache-2.0","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.08,"output":0.28},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"fp8","tagline":"Qwen3 is the latest generation of large language models in Qwen series, offering a comprehensive suite of dense and mixture-of-experts (MoE) models."},{"id":"Qwen/Qwen3-Coder-480B-A35B-Instruct-Turbo","name":"Qwen3-Coder-480B-A35B-Instruct-Turbo","created_by":"alibaba","source":"official","last_updated":"2026-04-26","family":"qwen3","description":"Qwen3-Coder-480B-A35B-Instruct is the Qwen3's most agentic code model, featuring Significant 
Performance on Agentic Coding, Agentic Browser-Use and other foundational coding tasks, achieving results comparable to Claude Sonnet.","status":"active","model_type":"chat","context_window":262144,"open_weight":true,"license":"apache-2.0","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.3,"output":1,"cached_input":0.1},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"fp4","tagline":"Qwen3-Coder-480B-A35B-Instruct is the Qwen3's most agentic code model, featuring Significant Performance on Agentic Coding, Agentic Browser-Use and other foundational coding tasks, achieving results c"},{"id":"Qwen/Qwen3-Embedding-0.6B-batch","name":"Qwen3-Embedding-0.6B-batch","created_by":"alibaba","source":"official","last_updated":"2026-04-26","family":"qwen3","description":"The Qwen3 Embedding model series is the latest proprietary model of the Qwen family, specifically designed for text embedding and ranking tasks. Building upon the dense foundational models of the Qwen3 series, it provides a comprehensive range of text embeddings and reranking models in various sizes (0.6B, 4B, and 8B).","status":"active","model_type":"embed","open_weight":true,"license":"apache-2.0","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["embeddings"],"tagline":"The Qwen3 Embedding model series is the latest proprietary model of the Qwen family, specifically designed for text embedding and ranking tasks."},{"id":"Qwen/Qwen3-Embedding-0.6B","name":"Qwen3-Embedding-0.6B","created_by":"alibaba","source":"official","last_updated":"2026-04-26","family":"qwen3","description":"The Qwen3 Embedding model series is the latest proprietary model of the Qwen family, specifically designed for text embedding and ranking tasks. 
Building upon the dense foundational models of the Qwen3 series, it provides a comprehensive range of text embeddings and reranking models in various sizes (0.6B, 4B, and 8B).","status":"active","model_type":"embed","open_weight":true,"license":"apache-2.0","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["embeddings"],"tagline":"The Qwen3 Embedding model series is the latest proprietary model of the Qwen family, specifically designed for text embedding and ranking tasks."},{"id":"Qwen/Qwen3-Embedding-4B-batch","name":"Qwen3-Embedding-4B-batch","created_by":"alibaba","source":"official","last_updated":"2026-04-26","family":"qwen3","description":"The Qwen3 Embedding model series is the latest proprietary model of the Qwen family, specifically designed for text embedding and ranking tasks. Building upon the dense foundational models of the Qwen3 series, it provides a comprehensive range of text embeddings and reranking models in various sizes (0.6B, 4B, and 8B).","status":"active","model_type":"embed","open_weight":true,"license":"apache-2.0","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["embeddings"],"tagline":"The Qwen3 Embedding model series is the latest proprietary model of the Qwen family, specifically designed for text embedding and ranking tasks."},{"id":"Qwen/Qwen3-Embedding-4B","name":"Qwen3-Embedding-4B","created_by":"alibaba","source":"official","last_updated":"2026-04-26","family":"qwen3","description":"The Qwen3 Embedding model series is the latest proprietary model of the Qwen family, specifically designed for text embedding and ranking tasks. 
Building upon the dense foundational models of the Qwen3 series, it provides a comprehensive range of text embeddings and reranking models in various sizes (0.6B, 4B, and 8B).","status":"active","model_type":"embed","open_weight":true,"license":"apache-2.0","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["embeddings"],"tagline":"The Qwen3 Embedding model series is the latest proprietary model of the Qwen family, specifically designed for text embedding and ranking tasks."},{"id":"Qwen/Qwen3-Embedding-8B-batch","name":"Qwen3-Embedding-8B-batch","created_by":"alibaba","source":"official","last_updated":"2026-04-26","family":"qwen3","description":"The Qwen3 Embedding model series is the latest proprietary model of the Qwen family, specifically designed for text embedding and ranking tasks. Building upon the dense foundational models of the Qwen3 series, it provides a comprehensive range of text embeddings and reranking models in various sizes (0.6B, 4B, and 8B).","status":"active","model_type":"embed","open_weight":true,"license":"apache-2.0","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["embeddings"],"tagline":"The Qwen3 Embedding model series is the latest proprietary model of the Qwen family, specifically designed for text embedding and ranking tasks."},{"id":"Qwen/Qwen3-Embedding-8B","name":"Qwen3-Embedding-8B","created_by":"alibaba","source":"official","last_updated":"2026-04-26","family":"qwen3","description":"The Qwen3 Embedding model series is the latest proprietary model of the Qwen family, specifically designed for text embedding and ranking tasks. 
Building upon the dense foundational models of the Qwen3 series, it provides a comprehensive range of text embeddings and reranking models in various sizes (0.6B, 4B, and 8B).","status":"active","model_type":"embed","open_weight":true,"license":"apache-2.0","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["embeddings"],"tagline":"The Qwen3 Embedding model series is the latest proprietary model of the Qwen family, specifically designed for text embedding and ranking tasks."},{"id":"Qwen/Qwen3-Max-Thinking","name":"Qwen3-Max-Thinking","created_by":"alibaba","source":"official","last_updated":"2026-04-26","family":"qwen3","description":"The latest flagship reasoning model in the Qwen3 family. Further enhanced by multiple innovations like adaptive tool-use and advanced test-time scaling techniques","status":"active","model_type":"chat","context_window":256000,"open_weight":false,"license":"apache-2.0","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":1.2,"output":6,"cached_input":0.24},"tools":["function_calling"],"endpoints":["chat_completions"],"tagline":"The latest flagship reasoning model in the Qwen3 family."},{"id":"Qwen/Qwen3-Max","name":"Qwen3-Max","created_by":"alibaba","source":"official","last_updated":"2026-04-26","family":"qwen3","description":"The latest flagship model in the Qwen family. 
State-of-the-art results across a comprehensive suite of benchmarks — including knowledge, reasoning, coding, instruction following, human preference alignment, agent tasks, and multilingual understanding.","status":"active","model_type":"chat","context_window":256000,"open_weight":false,"license":"apache-2.0","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":1.2,"output":6,"cached_input":0.24},"tools":["function_calling"],"endpoints":["chat_completions"],"tagline":"The latest flagship model in the Qwen family."},{"id":"Qwen/Qwen3-Next-80B-A3B-Instruct","name":"Qwen3-Next-80B-A3B-Instruct","created_by":"alibaba","source":"official","last_updated":"2026-04-26","family":"qwen3","description":"Over the past few months, we have observed increasingly clear trends toward scaling both total parameters and context lengths in the pursuit of more powerful and agentic artificial intelligence (AI). We are excited to share our latest advancements in addressing these demands, centered on improving scaling efficiency through innovative model architecture. 
We call this next-generation foundation models Qwen3-Next.","status":"active","model_type":"chat","context_window":262144,"open_weight":true,"license":"apache-2.0","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.09,"output":1.1},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"fp8","tagline":"Over the past few months, we have observed increasingly clear trends toward scaling both total parameters and context lengths in the pursuit of more powerful and agentic artificial intelligence (AI)."},{"id":"Qwen/Qwen3-Reranker-0.6B","name":"Qwen3-Reranker-0.6B","created_by":"alibaba","source":"official","last_updated":"2026-04-26","family":"qwen3","description":"The Qwen3 Embedding model series is the latest proprietary model of the Qwen family, specifically designed for text embedding and ranking tasks. Building upon the dense foundational models of the Qwen3 series, it provides a comprehensive range of text embeddings and reranking models in various sizes (0.6B, 4B, and 8B)","status":"active","model_type":"rerank","open_weight":true,"license":"apache-2.0","modalities":{"input":["text"],"output":["text"]},"endpoints":["rerank"],"tagline":"The Qwen3 Embedding model series is the latest proprietary model of the Qwen family, specifically designed for text embedding and ranking tasks."},{"id":"Qwen/Qwen3-Reranker-4B","name":"Qwen3-Reranker-4B","created_by":"alibaba","source":"official","last_updated":"2026-04-26","family":"qwen3","description":"The Qwen3 Embedding model series is the latest proprietary model of the Qwen family, specifically designed for text embedding and ranking tasks. 
Building upon the dense foundational models of the Qwen3 series, it provides a comprehensive range of text embeddings and reranking models in various sizes (0.6B, 4B, and 8B)","status":"active","model_type":"rerank","open_weight":true,"license":"apache-2.0","modalities":{"input":["text"],"output":["text"]},"endpoints":["rerank"],"tagline":"The Qwen3 Embedding model series is the latest proprietary model of the Qwen family, specifically designed for text embedding and ranking tasks."},{"id":"Qwen/Qwen3-Reranker-8B","name":"Qwen3-Reranker-8B","created_by":"alibaba","source":"official","last_updated":"2026-04-26","family":"qwen3","description":"The Qwen3 Embedding model series is the latest proprietary model of the Qwen family, specifically designed for text embedding and ranking tasks. Building upon the dense foundational models of the Qwen3 series, it provides a comprehensive range of text embeddings and reranking models in various sizes (0.6B, 4B, and 8B)","status":"active","model_type":"rerank","open_weight":true,"license":"apache-2.0","modalities":{"input":["text"],"output":["text"]},"endpoints":["rerank"],"tagline":"The Qwen3 Embedding model series is the latest proprietary model of the Qwen family, specifically designed for text embedding and ranking tasks."},{"id":"Qwen/Qwen3-TTS-VoiceDesign","name":"Qwen3-TTS-VoiceDesign","created_by":"alibaba","source":"official","last_updated":"2026-04-26","family":"qwen3","description":"● Qwen3-TTS-VoiceDesign is a voice design variant of Qwen3-TTS by Alibaba's Qwen team. Instead of selecting from preset voices, you describe the voice you want in natural language — and the model generates speech in that voice. Key capabilities: - Natural language voice control — describe any voice with free text (e.g. 
\"a deep male voice with a calm, authoritative presence\", \"a young cheerful female with a warm and friendly tone\") - 10 languages — English, Chinese, Japanese, Korean, German, F...","status":"active","model_type":"tts","open_weight":true,"license":"apache-2.0","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["audio"]},"endpoints":["audio_speech"],"pricing_notes":["$20.0000 per 1M input characters"],"tagline":"● Qwen3-TTS-VoiceDesign is a voice design variant of Qwen3-TTS by Alibaba's Qwen team."},{"id":"Qwen/Qwen3-TTS","name":"Qwen3-TTS","created_by":"alibaba","source":"official","last_updated":"2026-04-26","family":"qwen3","description":"Qwen3-TTS is an advanced text-to-speech model by Alibaba's Qwen team, delivering stable, expressive, and low-latency speech generation across 10 languages. Key capabilities: - 9 preset voices — Vivian, Serena, Uncle_Fu, Dylan, Eric, Ryan, Aiden, Ono_Anna, Sohee — covering diverse genders, ages, and accents - Voice cloning — clone any voice from a short (~3s) audio sample via the voice_id parameter - Instruction control — adjust tone, emotion, and speaking style with natural language (e.g. \"sp...","status":"active","model_type":"tts","open_weight":true,"license":"apache-2.0","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["audio"]},"endpoints":["audio_speech"],"pricing_notes":["$20.0000 per 1M input characters"],"tagline":"Qwen3-TTS is an advanced text-to-speech model by Alibaba's Qwen team, delivering stable, expressive, and low-latency speech generation across 10 languages."},{"id":"Qwen/Qwen3-VL-235B-A22B-Instruct","name":"Qwen3-VL-235B-A22B-Instruct","created_by":"alibaba","source":"official","last_updated":"2026-04-26","family":"qwen3","description":"Meet Qwen3-VL — the most powerful vision-language model in the Qwen series to date. 
This generation delivers comprehensive upgrades across the board: superior text understanding & generation, deeper visual perception & reasoning, extended context length, enhanced spatial and video dynamics comprehension, and stronger agent interaction capabilities.","status":"active","model_type":"chat","context_window":262144,"open_weight":true,"license":"apache-2.0","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"vision":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":0.2,"output":0.88,"cached_input":0.11},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"fp8","tagline":"Meet Qwen3-VL — the most powerful vision-language model in the Qwen series to date."},{"id":"Qwen/Qwen3-VL-30B-A3B-Instruct","name":"Qwen3-VL-30B-A3B-Instruct","created_by":"alibaba","source":"official","last_updated":"2026-04-26","family":"qwen3","description":"Meet Qwen3-VL — the most powerful vision-language model in the Qwen series to date. 
This generation delivers comprehensive upgrades across the board: superior text understanding & generation, deeper visual perception & reasoning, extended context length, enhanced spatial and video dynamics comprehension, and stronger agent interaction capabilities.","status":"active","model_type":"chat","context_window":262144,"open_weight":true,"license":"apache-2.0","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"vision":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":0.15,"output":0.6},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"fp8","tagline":"Meet Qwen3-VL — the most powerful vision-language model in the Qwen series to date."},{"id":"Qwen/Qwen3.5-0.8B","name":"Qwen3.5-0.8B","created_by":"alibaba","source":"official","last_updated":"2026-06-03","family":"qwen3","description":"Qwen3.5-0.8B is Alibaba's smallest model in the Qwen3.5 series, featuring a hybrid Gated Delta Networks and sparse Mixture-of-Experts architecture. Despite its compact size, it supports a 262K token context window, 201 languages, thinking/reasoning mode, and tool calling. 
Ideal for edge deployments, resource-constrained environments, and lightweight inference tasks.","status":"active","model_type":"chat","context_window":262144,"reasoning_tokens":true,"open_weight":true,"license":"apache-2.0","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"reasoning":true,"vision":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":0.01,"output":0.05},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"bfloat16","tagline":"Qwen3.5-0.8B is Alibaba's smallest model in the Qwen3.5 series, featuring a hybrid Gated Delta Networks and sparse Mixture-of-Experts architecture."},{"id":"Qwen/Qwen3.5-122B-A10B","name":"Qwen3.5-122B-A10B","created_by":"alibaba","source":"official","last_updated":"2026-06-29","family":"qwen3","description":"Qwen3.5-122B-A10B is a large Mixture-of-Experts model from Alibaba's Qwen3.5 series with 122B total parameters and 10B activated per token. It features a 262K token context window (extensible to 1M with YaRN), thinking/reasoning mode, tool calling, and support for 201 languages. 
Excels at complex reasoning, coding, multimodal understanding, and agentic tasks with the efficiency of sparse activation.","status":"active","model_type":"chat","context_window":16384,"reasoning_tokens":true,"open_weight":true,"license":"apache-2.0","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"reasoning":true,"vision":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":0.29,"output":2.4,"cached_input":0.145},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"fp4","tagline":"Qwen3.5-122B-A10B is a large Mixture-of-Experts model from Alibaba's Qwen3.5 series with 122B total parameters and 10B activated per token."},{"id":"Qwen/Qwen3.5-27B","name":"Qwen3.5-27B","created_by":"alibaba","source":"official","last_updated":"2026-04-26","family":"qwen3","description":"Qwen3.5-27B is Alibaba's largest dense Qwen3.5 model, delivering near-frontier quality across reasoning, coding, and instruction following. It features a 262K token context window (extensible to 1M), thinking/reasoning mode, tool calling, multi-token prediction, and support for 201 languages. 
Best suited for production deployments and complex enterprise tasks requiring top-tier performance.","status":"active","model_type":"chat","context_window":262144,"reasoning_tokens":true,"open_weight":true,"license":"apache-2.0","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"reasoning":true,"vision":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":0.26,"output":2.6},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"fp8","tagline":"Qwen3.5-27B is Alibaba's largest dense Qwen3.5 model, delivering near-frontier quality across reasoning, coding, and instruction following."},{"id":"Qwen/Qwen3.5-2B","name":"Qwen3.5-2B","created_by":"alibaba","source":"official","last_updated":"2026-06-03","family":"qwen3","description":"Qwen3.5-2B is a compact yet capable model from Alibaba's Qwen3.5 series. It features a 262K token context window, support for 201 languages, thinking/reasoning mode, and tool calling for agentic workflows. A strong choice for prototyping, fine-tuning, and efficient multilingual deployments.","status":"active","model_type":"chat","context_window":262144,"reasoning_tokens":true,"open_weight":true,"license":"apache-2.0","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"reasoning":true,"vision":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":0.02,"output":0.1},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"bfloat16","tagline":"Qwen3.5-2B is a compact yet capable model from Alibaba's Qwen3.5 series."},{"id":"Qwen/Qwen3.5-35B-A3B","name":"Qwen3.5-35B-A3B","created_by":"alibaba","source":"official","last_updated":"2026-06-03","family":"qwen3","description":"Qwen3.5-35B-A3B is an efficient Mixture-of-Experts model from Alibaba's Qwen3.5 series with 35B total parameters and only 3B activated per token. 
It features a 262K token context window (extensible to 1M with YaRN), thinking/reasoning mode, tool calling, and support for 201 languages. Delivers strong performance on reasoning, coding, and vision-language tasks at a fraction of the compute cost.","status":"active","model_type":"chat","context_window":262144,"reasoning_tokens":true,"open_weight":true,"license":"apache-2.0","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"reasoning":true,"vision":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":0.14,"output":1,"cached_input":0.05},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"fp8","tagline":"Qwen3.5-35B-A3B is an efficient Mixture-of-Experts model from Alibaba's Qwen3.5 series with 35B total parameters and only 3B activated per token."},{"id":"Qwen/Qwen3.5-397B-A17B","name":"Qwen3.5-397B-A17B","created_by":"alibaba","source":"official","last_updated":"2026-06-10","family":"qwen3","description":"Qwen3.5-397B-A17B is Alibaba's most capable Qwen3.5 model, a Mixture-of-Experts architecture with 397B total parameters and 17B activated per token. It features a 262K token context window (extensible to 1M with YaRN), thinking/reasoning mode, tool calling with MCP integration, and support for 201 languages. 
Sets state-of-the-art results on reasoning, coding, math, and multimodal benchmarks.","status":"active","model_type":"chat","context_window":262144,"reasoning_tokens":true,"open_weight":true,"license":"apache-2.0","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"reasoning":true,"vision":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":0.45,"output":3,"cached_input":0.22},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"fp8","tagline":"Qwen3.5-397B-A17B is Alibaba's most capable Qwen3.5 model, a Mixture-of-Experts architecture with 397B total parameters and 17B activated per token."},{"id":"Qwen/Qwen3.5-4B","name":"Qwen3.5-4B","created_by":"alibaba","source":"official","last_updated":"2026-06-03","family":"qwen3","description":"Qwen3.5-4B is a mid-size model from Alibaba's Qwen3.5 series that delivers a strong balance of performance and efficiency. It features a 262K token context window (extensible to 1M with YaRN), thinking/reasoning mode, tool calling, and support for 201 languages. 
Well-suited for complex reasoning, code generation, and agentic applications.","status":"active","model_type":"chat","context_window":262144,"reasoning_tokens":true,"open_weight":true,"license":"apache-2.0","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"reasoning":true,"vision":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":0.03,"output":0.15},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"bfloat16","tagline":"Qwen3.5-4B is a mid-size model from Alibaba's Qwen3.5 series that delivers a strong balance of performance and efficiency."},{"id":"Qwen/Qwen3.5-9B","name":"Qwen3.5-9B","created_by":"alibaba","source":"official","description":"Qwen3.5-9B is a high-performance model from Alibaba's Qwen3.5 series with a hybrid Gated Delta Networks and sparse MoE architecture. It features a 262K token context window, thinking/reasoning mode, tool calling, multi-token prediction, and support for 201 languages. 
Excels at reasoning, coding, instruction following, and long-context tasks.","status":"active","context_window":262144,"model_type":"chat","license":"apache-2.0","open_weight":true,"tagline":"Qwen3.5-9B is a high-performance model from Alibaba's Qwen3.5 series with a hybrid Gated Delta Networks and sparse MoE architecture.","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"vision":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":0.1,"output":0.15},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"bfloat16","last_updated":"2026-06-10"},{"id":"Qwen/Qwen3.6-27B","name":"Qwen3.6-27B","created_by":"alibaba","source":"official","status":"active","context_window":262144,"model_type":"chat","reasoning_tokens":true,"license":"apache-2.0","open_weight":true,"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"reasoning":true,"vision":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":0.32,"output":3.2},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"fp8","last_updated":"2026-06-03"},{"id":"Qwen/Qwen3.6-35B-A3B","name":"Qwen3.6-35B-A3B","created_by":"alibaba","source":"official","last_updated":"2026-06-03","family":"qwen3","description":"Qwen3.6-35B-A3B is Alibaba's latest flagship Mixture-of-Experts model, with 35B total parameters and only 3B activated per token (256 experts, 8 routed + 1 shared). 
Built on direct feedback from the community, Qwen3.6 prioritizes stability and real-world utility, offering developers a more intuitive, responsive, and genuinely productive coding experience.","status":"active","model_type":"chat","context_window":262144,"reasoning_tokens":true,"open_weight":true,"license":"apache-2.0","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"reasoning":true,"vision":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":0.15,"output":0.95},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"fp8","tagline":"Qwen3.6-35B-A3B is Alibaba's latest flagship Mixture-of-Experts model, with 35B total parameters and only 3B activated per token (256 experts, 8 routed + 1 shared)."},{"id":"Qwen/Qwen3.7-Max","name":"Qwen3.7-Max","created_by":"alibaba","source":"official","description":"The largest and most capable in the Qwen3.7 series. Qwen3.7 is a next‑generation flagship model designed for the agent‑centric.","status":"active","context_window":256000,"model_type":"chat","license":"apache-2.0","open_weight":false,"tagline":"The largest and most capable in the Qwen3.7 series.","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":2.5,"output":7.5,"cached_input":0.5},"tools":["function_calling"],"endpoints":["chat_completions"],"last_updated":"2026-06-03"},{"id":"ResembleAI/chatterbox-multilingual","name":"chatterbox-multilingual","created_by":"resembleai","source":"official","last_updated":"2026-04-26","family":"resembleai","description":"09/04 🔥 Introducing Chatterbox Multilingual in 23 Languages! We're excited to introduce Chatterbox and Chatterbox Multilingual, Resemble AI's production-grade open source TTS models. 
Chatterbox Multilingual supports Arabic, Danish, German, Greek, English, Spanish, Finnish, French, Hebrew, Hindi, Italian, Japanese, Korean, Malay, Dutch, Norwegian, Polish, Portuguese, Russian, Swedish, Swahili, Turkish, Chinese out of the box. Licensed under MIT, Chatterbox has been benchmarked against leading...","status":"active","model_type":"tts","open_weight":true,"capabilities":{"streaming":true},"modalities":{"input":["text"],"output":["audio"]},"endpoints":["audio_speech"],"pricing_notes":["$1.0000 per 1M input characters"],"tagline":"09/04 🔥 Introducing Chatterbox Multilingual in 23 Languages! We're excited to introduce Chatterbox and Chatterbox Multilingual, Resemble AI's production-grade open source TTS models."},{"id":"ResembleAI/chatterbox-turbo","name":"chatterbox-turbo","created_by":"resembleai","source":"official","last_updated":"2026-04-26","family":"resembleai","description":"Chatterbox is a family of three state-of-the-art, open-source text-to-speech models by Resemble AI. We are excited to introduce Chatterbox-Turbo, our most efficient model yet. Built on a streamlined 350M parameter architecture, Turbo delivers high-quality speech with less compute and VRAM than our previous models. We have also distilled the speech-token-to-mel decoder, previously a bottleneck, reducing generation from 10 steps to just one, while retaining high-fidelity audio output. 
Paralingu...","status":"active","model_type":"tts","open_weight":true,"capabilities":{"streaming":true},"modalities":{"input":["text"],"output":["audio"]},"endpoints":["audio_speech"],"pricing_notes":["$1.0000 per 1M input characters"],"tagline":"Chatterbox is a family of three state-of-the-art, open-source text-to-speech models by Resemble AI."},{"id":"Sao10K/L3-8B-Lunaris-v1-Turbo","name":"L3-8B-Lunaris-v1-Turbo","created_by":"sao10k","source":"official","last_updated":"2026-04-26","family":"sao10k","status":"active","model_type":"chat","context_window":8192,"open_weight":true,"capabilities":{"structured_output":true,"json_mode":true,"streaming":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.04,"output":0.05},"endpoints":["chat_completions"],"quantization":"fp8"},{"id":"Sao10K/L3.1-70B-Euryale-v2.2","name":"L3.1-70B-Euryale-v2.2","created_by":"sao10k","source":"official","last_updated":"2026-04-26","family":"sao10k","description":"Euryale 3.1 - 70B v2.2 is a model focused on creative roleplay from Sao10k","status":"active","model_type":"chat","context_window":131072,"open_weight":true,"capabilities":{"structured_output":true,"json_mode":true,"streaming":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.85,"output":0.85},"endpoints":["chat_completions"],"quantization":"fp8","tagline":"Euryale 3.1 - 70B v2.2 is a model focused on creative roleplay from Sao10k"},{"id":"Sao10K/L3.3-70B-Euryale-v2.3","name":"L3.3-70B-Euryale-v2.3","created_by":"sao10k","source":"official","last_updated":"2026-04-26","family":"sao10k","description":"L3.3-70B-Euryale-v2.3 is a model focused on creative roleplay from 
Sao10k","status":"active","model_type":"chat","context_window":131072,"open_weight":true,"capabilities":{"structured_output":true,"json_mode":true,"streaming":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.85,"output":0.85},"endpoints":["chat_completions"],"quantization":"fp8","tagline":"L3.3-70B-Euryale-v2.3 is a model focused on creative roleplay from Sao10k"},{"id":"sentence-transformers/all-MiniLM-L12-v2","name":"all-MiniLM-L12-v2","created_by":"sentence-transformers","source":"official","last_updated":"2026-04-26","family":"sentence-transformers","description":"We present a sentence transformation model that generates semantically similar sentences. Our model is based on the Sentence-Transformers architecture and was trained on a large dataset of sentence pairs. We evaluate the effectiveness of our model by measuring its ability to generate similar sentences that are close to the original sentence in meaning.","status":"active","model_type":"embed","open_weight":true,"license":"apache-2.0","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["embeddings"],"tagline":"We present a sentence transformation model that generates semantically similar sentences."},{"id":"sentence-transformers/all-MiniLM-L6-v2","name":"all-MiniLM-L6-v2","created_by":"sentence-transformers","source":"official","last_updated":"2026-04-26","family":"sentence-transformers","description":"We present a sentence transformation model that achieves state-of-the-art results on various NLP tasks without requiring task-specific architectures or fine-tuning. Our approach leverages contrastive learning and utilizes a variety of datasets to learn robust sentence representations. 
We evaluate our model on several benchmarks and demonstrate its effectiveness in various applications such as text classification, sentiment analysis, named entity recognition, and question answering.","status":"active","model_type":"embed","open_weight":true,"license":"apache-2.0","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["embeddings"],"tagline":"We present a sentence transformation model that achieves state-of-the-art results on various NLP tasks without requiring task-specific architectures or fine-tuning."},{"id":"sentence-transformers/all-mpnet-base-v2","name":"all-mpnet-base-v2","created_by":"sentence-transformers","source":"official","last_updated":"2026-04-26","family":"sentence-transformers","description":"A sentence transformation model that has been trained on a wide range of datasets, including but not limited to S2ORC, WikiAnwers, PAQ, Stack Exchange, and Yahoo! Answers. Our model can be used for various NLP tasks such as clustering, sentiment analysis, and question answering.","status":"active","model_type":"embed","open_weight":true,"license":"apache-2.0","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["embeddings"],"tagline":"A sentence transformation model that has been trained on a wide range of datasets, including but not limited to S2ORC, WikiAnwers, PAQ, Stack Exchange, and Yahoo! Answers."},{"id":"sentence-transformers/clip-ViT-B-32-multilingual-v1","name":"clip-ViT-B-32-multilingual-v1","created_by":"sentence-transformers","source":"official","last_updated":"2026-04-26","family":"sentence-transformers","description":"This model is a multilingual version of the OpenAI CLIP-ViT-B32 model, which maps text and images to a common dense vector space. It includes a text embedding model that works for 50+ languages and an image encoder from CLIP. 
The model was trained using Multilingual Knowledge Distillation, where a multilingual DistilBERT model was trained as a student model to align the vector space of the original CLIP image encoder across many languages.","status":"active","model_type":"embed","open_weight":true,"license":"apache-2.0","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["embeddings"],"tagline":"This model is a multilingual version of the OpenAI CLIP-ViT-B32 model, which maps text and images to a common dense vector space."},{"id":"sentence-transformers/clip-ViT-B-32","name":"clip-ViT-B-32","created_by":"sentence-transformers","source":"official","last_updated":"2026-04-26","family":"sentence-transformers","description":"The CLIP model maps text and images to a shared vector space, enabling various applications such as image search, zero-shot image classification, and image clustering. The model can be used easily after installation, and its performance is demonstrated through zero-shot ImageNet validation set accuracy scores. Multilingual versions of the model are also available for 50+ languages.","status":"active","model_type":"embed","open_weight":true,"license":"apache-2.0","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["embeddings"],"tagline":"The CLIP model maps text and images to a shared vector space, enabling various applications such as image search, zero-shot image classification, and image clustering."},{"id":"sentence-transformers/multi-qa-mpnet-base-dot-v1","name":"multi-qa-mpnet-base-dot-v1","created_by":"sentence-transformers","source":"official","last_updated":"2026-04-26","family":"sentence-transformers","description":"We present a sentence transformation model that maps sentences and paragraphs to a 768-dimensional dense vector space, suitable for semantic search tasks. 
The model is trained on 215 million question-answer pairs from various sources, including WikiAnswers, PAQ, Stack Exchange, MS MARCO, GOOAQ, Amazon QA, Yahoo Answers, Search QA, ELI5, and Natural Questions. Our model uses a contrastive learning objective.","status":"active","model_type":"embed","open_weight":true,"license":"apache-2.0","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["embeddings"],"tagline":"We present a sentence transformation model that maps sentences and paragraphs to a 768-dimensional dense vector space, suitable for semantic search tasks."},{"id":"sentence-transformers/paraphrase-MiniLM-L6-v2","name":"paraphrase-MiniLM-L6-v2","created_by":"sentence-transformers","source":"official","last_updated":"2026-04-26","family":"sentence-transformers","description":"We present a sentence similarity model based on the Sentence Transformers architecture, which maps sentences to a 384-dimensional dense vector space. The model uses a pre-trained BERT encoder and applies mean pooling on top of the contextualized word embeddings to obtain sentence embeddings. We evaluate the model on the Sentence Embeddings Benchmark.","status":"active","model_type":"embed","open_weight":true,"license":"apache-2.0","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["embeddings"],"tagline":"We present a sentence similarity model based on the Sentence Transformers architecture, which maps sentences to a 384-dimensional dense vector space."},{"id":"sesame/csm-1b","name":"csm-1b","created_by":"sesame","source":"official","last_updated":"2026-04-26","family":"sesame","description":"CSM (Conversational Speech Model) is a speech generation model from Sesame that generates RVQ audio codes from text and audio inputs. 
The model architecture employs a Llama backbone and a smaller audio decoder that produces Mimi audio codes.","status":"active","model_type":"tts","open_weight":true,"capabilities":{"streaming":true},"modalities":{"input":["text"],"output":["audio"]},"endpoints":["audio_speech"],"pricing_notes":["$7.0000 per 1M input characters"],"tagline":"CSM (Conversational Speech Model) is a speech generation model from Sesame that generates RVQ audio codes from text and audio inputs."},{"id":"shibing624/text2vec-base-chinese","name":"text2vec-base-chinese","created_by":"shibing624","source":"official","last_updated":"2026-04-26","family":"shibing624","description":"A sentence similarity model that can be used for various NLP tasks such as text classification, sentiment analysis, named entity recognition, question answering, and more. It utilizes the CoSENT architecture, which consists of a transformer encoder and a pooling module, to encode input texts into vectors that capture their semantic meaning. The model was trained on the nli_zh dataset and achieved high performance on various benchmark datasets.","status":"active","model_type":"embed","open_weight":true,"capabilities":{"streaming":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["embeddings"],"tagline":"A sentence similarity model that can be used for various NLP tasks such as text classification, sentiment analysis, named entity recognition, question answering, and more."},{"id":"stabilityai/sdxl-turbo","name":"sdxl-turbo","created_by":"stability-ai","source":"official","last_updated":"2026-04-26","family":"sdxl","description":"The SDXL Turbo model, developed by Stability AI, is an optimized, fast text-to-image generative model. 
It is a distilled version of SDXL 1.0, leveraging Adversarial Diffusion Distillation (ADD) to generate high-quality images in less steps.","status":"active","model_type":"image","open_weight":true,"license":"stability-ai","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"pricing_notes":["$0.0002 per image unit (1024x1024 default)"],"tagline":"The SDXL Turbo model, developed by Stability AI, is an optimized, fast text-to-image generative model."},{"id":"stepfun-ai/Step-3.5-Flash","name":"Step-3.5-Flash","created_by":"stepfun","source":"official","last_updated":"2026-06-03","family":"step-3","description":"Step 3.5 Flash is an open-source reasoning model by StepFun with 196B total parameters (11B active) using Mixture of Experts. It features a 256K context window, deep reasoning, tool calling, and agentic capabilities, achieving 97.3 on AIME 2025 and 74.4% on SWE-bench Verified.","status":"active","model_type":"chat","context_window":262144,"open_weight":true,"license":"apache-2.0","capabilities":{"tool_call":true,"streaming":true,"fine_tuning":true,"reasoning":true,"structured_output":true,"json_mode":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.09,"output":0.3,"cached_input":0.02},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"fp8","tagline":"Step 3.5 Flash is an open-source reasoning model by StepFun with 196B total parameters (11B active) using Mixture of Experts."},{"id":"stepfun-ai/Step-3.7-Flash","name":"Step-3.7-Flash","created_by":"stepfun","source":"official","description":"Step 3.7 Flash is an open-source multimodal reasoning model by StepFun with 198B total parameters (11B active) using Mixture of Experts. 
It accepts text and image inputs and features a 256K context window, selectable reasoning effort, tool calling, and agentic capabilities for coding and search workflows, scoring 80.9% on GPQA Diamond and 56.3% on SWE-bench Pro.","status":"active","context_window":262144,"model_type":"chat","license":"apache-2.0","open_weight":true,"tagline":"Step 3.7 Flash is an open-source multimodal reasoning model by StepFun with 198B total parameters (11B active) using Mixture of Experts.","capabilities":{"tool_call":true,"vision":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":0.2,"output":1.15,"cached_input":0.04},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"modelopt","last_updated":"2026-06-18"},{"id":"thenlper/gte-base","name":"gte-base","created_by":"thenlper","source":"official","last_updated":"2026-04-26","family":"thenlper","description":"The GTE models are trained by Alibaba DAMO Academy. They are mainly based on the BERT framework and currently offer three different sizes of models, including GTE-large, GTE-base, and GTE-small. The GTE models are trained on a large-scale corpus of relevance text pairs, covering a wide range of domains and scenarios. This enables the GTE models to be applied to various downstream tasks of text embeddings, including information retrieval, semantic textual similarity, text reranking, etc.","status":"active","model_type":"embed","open_weight":true,"capabilities":{"streaming":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["embeddings"],"tagline":"The GTE models are trained by Alibaba DAMO Academy."},{"id":"thenlper/gte-large","name":"gte-large","created_by":"thenlper","source":"official","last_updated":"2026-04-26","family":"thenlper","description":"The GTE models are trained by Alibaba DAMO Academy. 
They are mainly based on the BERT framework and currently offer three different sizes of models, including GTE-large, GTE-base, and GTE-small. The GTE models are trained on a large-scale corpus of relevance text pairs, covering a wide range of domains and scenarios. This enables the GTE models to be applied to various downstream tasks of text embeddings, including information retrieval, semantic textual similarity, text reranking, etc.","status":"active","model_type":"embed","open_weight":true,"capabilities":{"streaming":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["embeddings"],"tagline":"The GTE models are trained by Alibaba DAMO Academy."},{"id":"Wan-AI/Wan2.2-T2V-A14B","name":"Wan2.2-T2V-A14B","created_by":"wan-ai","source":"official","last_updated":"2026-04-26","family":"Wan2.2","description":"The Wan2.2 T2V A14B is a next-generation 14B-parameter video foundation model by Wan-AI featuring a novel two-stage denoising architecture. It produces 480P videos with improved visual coherence and detail, generating 2 or 5 second clips at 16fps from text prompts.","status":"active","model_type":"video","open_weight":true,"modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"tagline":"The Wan2.2 T2V A14B is a next-generation 14B-parameter video foundation model by Wan-AI featuring a novel two-stage denoising architecture."},{"id":"Wan-AI/Wan2.6-I2V","name":"Wan2.6-I2V","created_by":"wan-ai","source":"official","last_updated":"2026-04-26","family":"Wan2.6","description":"Turn any image into a video. 
Intelligent shot scheduling supports multi-shot storytelling, generating multi-shot narrative videos with consistent subjects, scenes, and atmosphere","status":"active","model_type":"video","open_weight":false,"modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"pricing_notes":["$0.10 / second"],"tagline":"Turn any image into a video."},{"id":"Wan-AI/Wan2.6-Image-Edit","name":"Wan2.6-Image-Edit","created_by":"wan-ai","source":"official","last_updated":"2026-04-26","family":"Wan2.6","description":"An all-round image generation model that supports joint text–image reasoning, multi-image creative fusion, commercial-grade consistency, aesthetic style transfer, and precise control of framing and lighting, significantly enhancing consistency, controllability, and expressiveness in image generation.","status":"active","model_type":"image","open_weight":false,"capabilities":{"streaming":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"pricing_notes":["$0.0300 per image unit (0x0 default)"],"tagline":"An all-round image generation model that supports joint text–image reasoning, multi-image creative fusion, commercial-grade consistency, aesthetic style transfer, and precise control of framing and li"},{"id":"Wan-AI/Wan2.6-T2I","name":"Wan2.6-T2I","created_by":"wan-ai","source":"official","last_updated":"2026-04-26","family":"Wan2.6","description":"Wan2.6 text to image, Upgraded visual quality, aesthetics, and instruction-following deliver precise style control, realistic portraits, long-text understanding, and broad historical/cultural IP coverage, enabling high-quality, highly expressive visual generation.","status":"active","model_type":"image","open_weight":false,"capabilities":{"streaming":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"pricing_notes":["$0.0300 per image unit (0x0 default)"],"tagline":"Wan2.6 text to image, Upgraded visual quality, aesthetics, and instruction-following 
deliver precise style control, realistic portraits, long-text understanding, and broad historical/cultural IP cover"},{"id":"Wan-AI/Wan2.6-T2V","name":"Wan2.6-T2V","created_by":"wan-ai","source":"official","last_updated":"2026-04-26","family":"Wan2.6","description":"Turn any prompt into a smooth video. Intelligent shot scheduling supports multi-shot storytelling, generating multi-shot narrative videos with consistent subjects, scenes, and atmosphere","status":"active","model_type":"video","open_weight":false,"modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"pricing_notes":["$0.10 / second"],"tagline":"Turn any prompt into a smooth video."},{"id":"Wan-AI/Wan2.7-I2V","name":"Wan2.7-I2V","created_by":"wan-ai","source":"official","family":"Wan2.7","description":"Generates video content from images while stably preserving details such as subject, style, and text elements. Ensures visual consistency and information fidelity throughout dynamic transitions.","status":"active","model_type":"video","open_weight":false,"tagline":"Generates video content from images while stably preserving details such as subject, style, and text elements.","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"pricing_notes":["$0.10 / second"],"last_updated":"2026-06-03"},{"id":"Wan-AI/Wan2.7-Image-Edit","name":"Wan2.7-Image-Edit","created_by":"wan-ai","source":"official","last_updated":"2026-04-26","family":"Wan2.7","description":"Bleeding edge image model supporting generation and editing, text to image, text/image to sequential images, image editing, multi-image reference generation, and interactive editing. 
Delivers enhanced performance in text rendering, subject consistency, and complex instruction following","status":"active","model_type":"image","open_weight":false,"capabilities":{"streaming":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"pricing_notes":["$0.0300 per image unit (0x0 default)"],"tagline":"Bleeding edge image model supporting generation and editing, text to image, text/image to sequential images, image editing, multi-image reference generation, and interactive editing."},{"id":"Wan-AI/Wan2.7-R2V","name":"Wan2.7-R2V","created_by":"wan-ai","source":"official","family":"Wan2.7","description":"Accurately preserve the look and voice of people or objects from a reference video, supporting multi-reference co-creation.","status":"active","model_type":"video","open_weight":false,"tagline":"Accurately preserve the look and voice of people or objects from a reference video, supporting multi-reference co-creation.","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"pricing_notes":["$0.10 / second"],"last_updated":"2026-06-03"},{"id":"XiaomiMiMo/MiMo-V2.5-Pro","name":"MiMo-V2.5-Pro","created_by":"xiaomimimo","source":"official","family":"mimo","description":"MiMo-V2.5-Pro is an open-source Mixture-of-Experts (MoE) language model with 1.02T total parameters and 42B active parameters. 
It utilizes the hybrid attention architecture and 3-layers Multi-Token Prediction (MTP) introduced in [MiMo-V2-Flash](https://github.com/XiaomiMiMo/MiMo-V2-Flash).","status":"active","context_window":1048576,"model_type":"chat","reasoning_tokens":true,"open_weight":true,"tagline":"MiMo-V2.5-Pro is an open-source Mixture-of-Experts (MoE) language model with 1.02T total parameters and 42B active parameters.","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"reasoning":true,"streaming":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":1,"output":3,"cached_input":0.2},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"fp8","last_updated":"2026-06-03"},{"id":"XiaomiMiMo/MiMo-V2.5-tts-voiceclone","name":"MiMo-V2.5-tts-voiceclone","created_by":"xiaomimimo","source":"official","family":"mimo","description":"Automatically convert input text into natural and fluent speech output. You can generate natural and vivid speech content by configuring parameters such as speech. Precisely replicate voices from audio samples to enable speech synthesis of any voice. style and voice.","status":"active","model_type":"tts","open_weight":false,"tagline":"Automatically convert input text into natural and fluent speech output.","capabilities":{"streaming":true},"modalities":{"input":["text"],"output":["audio"]},"endpoints":["audio_speech"],"pricing_notes":["$0.0000 per 1M input characters"],"last_updated":"2026-06-03"},{"id":"XiaomiMiMo/MiMo-V2.5-tts-voicedesign","name":"MiMo-V2.5-tts-voicedesign","created_by":"xiaomimimo","source":"official","family":"mimo","description":"Automatically convert input text into natural and fluent speech output. You can generate natural and vivid speech content by configuring parameters such as speech style and voice. 
Automatically generate voices from text descriptions, without requiring presets or audio samples.","status":"active","model_type":"tts","open_weight":false,"tagline":"Automatically convert input text into natural and fluent speech output.","capabilities":{"streaming":true},"modalities":{"input":["text"],"output":["audio"]},"endpoints":["audio_speech"],"pricing_notes":["$0.0000 per 1M input characters"],"last_updated":"2026-06-03"},{"id":"XiaomiMiMo/MiMo-V2.5-tts","name":"MiMo-V2.5-tts","created_by":"xiaomimimo","source":"official","family":"mimo","description":"Automatically convert input text into natural and fluent speech output. You can generate natural and vivid speech content by configuring parameters such as speech style and voice. Use the high-quality voices from the built-in voices list.","status":"active","model_type":"tts","open_weight":false,"tagline":"Automatically convert input text into natural and fluent speech output.","capabilities":{"streaming":true},"modalities":{"input":["text"],"output":["audio"]},"endpoints":["audio_speech"],"pricing_notes":["$0.0000 per 1M input characters"],"last_updated":"2026-06-03"},{"id":"XiaomiMiMo/MiMo-V2.5","name":"MiMo-V2.5","created_by":"xiaomimimo","source":"official","family":"mimo","description":"MiMo-V2.5 is a native omnimodal model with strong agentic capabilities, supporting text, image, video, and audio understanding within a unified architecture. 
Built upon the MiMo-V2-Flash backbone and extended with dedicated vision and audio encoders, it delivers robust performance across multimodal perception, long-context reasoning, and agentic workflows.","status":"active","context_window":262144,"model_type":"chat","reasoning_tokens":true,"open_weight":true,"tagline":"MiMo-V2.5 is a native omnimodal model with strong agentic capabilities, supporting text, image, video, and audio understanding within a unified architecture.","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"reasoning":true,"vision":true,"streaming":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":0.4,"output":2,"cached_input":0.08},"tools":["function_calling"],"endpoints":["chat_completions"],"last_updated":"2026-06-03"},{"id":"zai-org/GLM-4.6","name":"GLM-4.6","created_by":"zhipu","source":"official","last_updated":"2026-04-26","family":"GLM-4.6","description":"Compared with GLM-4.5, GLM-4.6 brings several key improvements: Longer context window: The context window has been expanded from 128K to 200K tokens, enabling the model to handle more complex agentic tasks. Superior coding performance: The model achieves higher scores on code benchmarks and demonstrates better real-world performance in applications such as Claude Code、Cline、Roo Code and Kilo Code, including improvements in generating visually polished front-end pages. 
Advanced reasoning: GLM-...","status":"active","model_type":"chat","context_window":202752,"reasoning_tokens":true,"open_weight":true,"license":"mit","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"reasoning":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.43,"output":1.74,"cached_input":0.08},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"fp4","tagline":"Compared with GLM-4.5, GLM-4.6 brings several key improvements: Longer context window: The context window has been expanded from 128K to 200K tokens, enabling the model to handle more complex agentic tasks."},{"id":"zai-org/GLM-4.7-Flash","name":"GLM-4.7-Flash","created_by":"zhipu","source":"official","last_updated":"2026-04-26","family":"GLM-4.7","description":"GLM-4.7-Flash is a 30B-A3B MoE model. As the strongest model in the 30B class, GLM-4.7-Flash offers a new option for lightweight deployment that balances performance and efficiency.","status":"active","model_type":"chat","context_window":202752,"reasoning_tokens":true,"open_weight":true,"license":"mit","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"reasoning":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.06,"output":0.4,"cached_input":0.01},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"bfloat16","tagline":"GLM-4.7-Flash is a 30B-A3B MoE model."},{"id":"zai-org/GLM-4.7","name":"GLM-4.7","created_by":"zhipu","source":"official","last_updated":"2026-04-26","family":"GLM-4.7","description":"GLM-4.7 is a state-of-the-art, multilingual Mixture-of-Experts (MoE) language model designed for complex reasoning, agentic coding, and tool use. 
Building on its predecessor GLM-4.6, it delivers significant improvements across key benchmarks, including multilingual SWE-bench, Terminal Bench, and reasoning-heavy evaluations like HLE. The model features advanced \"Interleaved Thinking\" and new \"Preserved Thinking\" modes, allowing it to reason before actions and maintain consistency across long, ...","status":"active","model_type":"chat","context_window":202752,"reasoning_tokens":true,"open_weight":true,"license":"mit","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"reasoning":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.4,"output":1.75,"cached_input":0.08},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"fp4","tagline":"GLM-4.7 is a state-of-the-art, multilingual Mixture-of-Experts (MoE) language model designed for complex reasoning, agentic coding, and tool use."},{"id":"zai-org/GLM-5.1","name":"GLM-5.1","created_by":"zhipu","source":"official","last_updated":"2026-04-26","family":"GLM-5.1","description":"GLM-5.1 is Z-AI's next-generation flagship model for agentic engineering, with significantly stronger coding capabilities than its predecessor. 
It achieves state-of-the-art performance on SWE-Bench Pro and leads GLM-5 by a wide margin on NL2Repo (repo generation) and Terminal-Bench 2.0 (real-world terminal tasks).","status":"active","model_type":"chat","context_window":202752,"reasoning_tokens":true,"open_weight":true,"license":"mit","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"reasoning":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":1.05,"output":3.5,"cached_input":0.205},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"fp4","tagline":"GLM-5.1 is Z-AI's next-generation flagship model for agentic engineering, with significantly stronger coding capabilities than its predecessor."},{"id":"zai-org/GLM-5.2","name":"GLM-5.2","created_by":"zhipu","source":"official","family":"GLM-5.2","description":"GLM-5.2 is Z-AI's latest flagship model for long-horizon tasks. It marks a substantial leap in long-horizon task capability over its predecessor GLM-5.1 and, for the first time, delivers that capability on a **solid 1M-token context**.","status":"active","context_window":1048576,"model_type":"chat","reasoning_tokens":true,"license":"mit","open_weight":true,"tagline":"GLM-5.2 is Z-AI's latest flagship model for long-horizon tasks.","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"reasoning":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.95,"output":3,"cached_input":0.18},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"fp4","last_updated":"2026-06-29"},{"id":"zai-org/GLM-5","name":"GLM-5","created_by":"zhipu","source":"official","last_updated":"2026-04-26","family":"GLM-5","description":"GLM-5 is an advanced, open-source large language model designed for developers tackling the toughest challenges. 
It excels at long-context reasoning, multi-step tool orchestration, and complex systems engineering, making it the ideal choice for powering sophisticated agents and applications that require high-level cognitive tasks.","status":"active","model_type":"chat","context_window":202752,"reasoning_tokens":true,"open_weight":true,"license":"mit","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"reasoning":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.6,"output":2.08,"cached_input":0.12},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"fp4","tagline":"GLM-5 is an advanced, open-source large language model designed for developers tackling the toughest challenges."},{"id":"Zyphra/Zonos-v0.1-hybrid","name":"Zonos-v0.1-hybrid","created_by":"zyphra","source":"official","last_updated":"2026-04-26","family":"zyphra","description":"Zonos-v0.1 is a leading open-weight text-to-speech model trained on more than 200k hours of varied multilingual speech, delivering expressiveness and quality on par with—or even surpassing—top TTS providers. Our model enables highly natural speech generation from text prompts when given a speaker embedding or audio prefix, and can accurately perform speech cloning when given a reference clip spanning just a few seconds. 
The conditioning setup also allows for fine control over speaking rate, p...","status":"active","model_type":"tts","open_weight":true,"capabilities":{"streaming":true},"modalities":{"input":["text"],"output":["audio"]},"endpoints":["audio_speech"],"pricing_notes":["$7.0000 per 1M input characters"],"tagline":"Zonos-v0.1 is a leading open-weight text-to-speech model trained on more than 200k hours of varied multilingual speech, delivering expressiveness and quality on par with—or even surpassing—top TTS providers."},{"id":"Zyphra/Zonos-v0.1-transformer","name":"Zonos-v0.1-transformer","created_by":"zyphra","source":"official","last_updated":"2026-04-26","family":"zyphra","description":"Zonos-v0.1 is a leading open-weight text-to-speech model trained on more than 200k hours of varied multilingual speech, delivering expressiveness and quality on par with—or even surpassing—top TTS providers. Our model enables highly natural speech generation from text prompts when given a speaker embedding or audio prefix, and can accurately perform speech cloning when given a reference clip spanning just a few seconds. 
The conditioning setup also allows for fine control over speaking rate, p...","status":"active","model_type":"tts","open_weight":true,"capabilities":{"streaming":true},"modalities":{"input":["text"],"output":["audio"]},"endpoints":["audio_speech"],"pricing_notes":["$7.0000 per 1M input characters"],"tagline":"Zonos-v0.1 is a leading open-weight text-to-speech model trained on more than 200k hours of varied multilingual speech, delivering expressiveness and quality on par with—or even surpassing—top TTS providers."}]}; +export const provider: ProviderWithModels = {"id":"deepinfra","name":"DeepInfra","region":"US","headquarters":"Palo Alto, CA","founded":2022,"url":"https://deepinfra.com","api_url":"https://api.deepinfra.com/v1/openai","docs_url":"https://deepinfra.com/docs","pricing_url":"https://deepinfra.com/pricing","description":"Serverless inference cloud for open-weight LLMs, image, video, TTS, transcription, embedding, and reranker models with an OpenAI-compatible API.","type":"cloud","playground_url":"https://deepinfra.com/chat","status_url":"https://status.deepinfra.com","openai_compatible":true,"free_tier":false,"github_url":"https://github.com/deepinfra","models_url":"https://deepinfra.com/models","twitter_url":"https://x.com/DeepInfra","discord_url":"https://discord.gg/deepinfra","blog_url":"https://deepinfra.com/blog","terms_url":"https://deepinfra.com/terms","support_url":"https://deepinfra.com/contact","icon":"\n \n \n","models":[{"id":"ACE-Step/acestep-v15-xl-sft","name":"acestep-v15-xl-sft","created_by":"ace-step","source":"official","description":"ACE-Step v1.5 is a powerful open-source music foundation model that turns a text prompt into a complete song — vocals, lyrics, and instrumentation — at quality that rivals commercial tools. 
We run the high-quality XL checkpoint with its planning step (\"thinking\") on by default, so generations favor musical structure and coherence over raw speed.","status":"active","model_type":"chat","open_weight":true,"tagline":"ACE-Step v1.5 is a powerful open-source music foundation model that turns a text prompt into a complete song — vocals, lyrics, and instrumentation — at quality that rivals commercial tools.","capabilities":{"streaming":true},"modalities":{"input":["text"],"output":["text"]},"pricing_notes":["$0.001 / second of audio"],"last_updated":"2026-06-18"},{"id":"allenai/Olmo-3.1-32B-Instruct","name":"Olmo-3.1-32B-Instruct","created_by":"allenai","source":"official","last_updated":"2026-04-26","family":"allenai","description":"Olmo is a series of Open language models, developed by Allen Institute for AI (Ai2), designed to enable the science of language models.","status":"active","model_type":"chat","context_window":65536,"open_weight":true,"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.2,"output":0.6},"tools":["function_calling"],"endpoints":["chat_completions"],"tagline":"Olmo is a series of Open language models, developed by Allen Institute for AI (Ai2), designed to enable the science of language models."},{"id":"allenai/olmOCR-2-7B-1025","name":"olmOCR-2-7B-1025","created_by":"allenai","source":"official","last_updated":"2026-04-26","family":"allenai","description":"olmOCR is a specialized AI tool that converts PDF documents into clean, structured text while preserving important formatting and layout information. What makes olmOCR particularly valuable for developers is its ability to handle challenging PDFs that traditional OCR tools struggle with—including complex layouts, poor-quality scans, handwritten text, and documents with mixed content types. 
Built on a fine-tuned 7B vision-language model, olmOCR provides enterprise-grade PDF processing at a fra...","status":"active","model_type":"chat","context_window":16384,"open_weight":true,"capabilities":{"structured_output":true,"json_mode":true,"vision":true,"streaming":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":0.09,"output":0.19},"endpoints":["chat_completions"],"quantization":"fp8","tagline":"olmOCR is a specialized AI tool that converts PDF documents into clean, structured text while preserving important formatting and layout information."},{"id":"anthropic/claude-3-7-sonnet-latest","name":"claude-3-7-sonnet-latest","created_by":"anthropic","source":"official","last_updated":"2026-04-26","family":"claude-sonnet","status":"active","model_type":"chat","context_window":200000,"open_weight":false,"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"vision":true,"streaming":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":3.3,"output":16.5,"cached_input":0.33},"tools":["function_calling"],"endpoints":["chat_completions"]},{"id":"anthropic/claude-4-opus","name":"claude-4-opus","created_by":"anthropic","source":"official","last_updated":"2026-04-26","family":"claude-opus","description":"Anthropic’s most powerful model yet and the state-of-the-art coding model. It delivers sustained performance on long-running tasks that require focused effort and thousands of steps, significantly expanding what AI agents can solve. 
Claude Opus 4 is ideal for powering frontier agent products and features.","status":"active","model_type":"chat","context_window":200000,"open_weight":false,"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"vision":true,"streaming":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":16.5,"output":82.5},"tools":["function_calling"],"endpoints":["chat_completions"],"tagline":"Anthropic’s most powerful model yet and the state-of-the-art coding model."},{"id":"anthropic/claude-4-sonnet","name":"claude-4-sonnet","created_by":"anthropic","source":"official","last_updated":"2026-04-26","family":"claude-sonnet","description":"Anthropic's mid-size model with superior intelligence for high-volume uses in coding, in-depth research, agents, & more.","status":"active","model_type":"chat","context_window":200000,"open_weight":false,"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"vision":true,"streaming":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":3.3,"output":16.5},"tools":["function_calling"],"endpoints":["chat_completions"],"tagline":"Anthropic's mid-size model with superior intelligence for high-volume uses in coding, in-depth research, agents, & more."},{"id":"anthropic/claude-haiku-4-5","name":"claude-haiku-4-5","created_by":"anthropic","source":"official","family":"claude-haiku","description":"The next generation of Anthropic's fastest and most cost-effective model, optimal for use cases where speed and affordability matter.","status":"active","context_window":200000,"model_type":"chat","reasoning_tokens":true,"open_weight":false,"tagline":"The next generation of Anthropic's fastest and most cost-effective model, optimal for use cases where speed and affordability 
matter.","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"reasoning":true,"vision":true,"streaming":true,"batch":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":1,"output":5},"tools":["function_calling"],"endpoints":["chat_completions"],"last_updated":"2026-06-03","max_output_tokens":64000,"knowledge_cutoff":"2025-02","training_data_cutoff":"2025-07","license":"proprietary"},{"id":"anthropic/claude-opus-4-7","name":"claude-opus-4-7","created_by":"anthropic","source":"official","family":"claude-opus","description":"Anthropic's most capable production model yet, advancing performance across coding, enterprise workflows, and long-running agentic tasks.","status":"active","context_window":1000000,"model_type":"chat","reasoning_tokens":true,"open_weight":false,"tagline":"Anthropic's most capable production model yet, advancing performance across coding, enterprise workflows, and long-running agentic tasks.","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"reasoning":true,"vision":true,"streaming":true,"batch":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":5,"output":25},"tools":["function_calling"],"endpoints":["chat_completions"],"last_updated":"2026-06-03","max_output_tokens":128000,"knowledge_cutoff":"2026-01","training_data_cutoff":"2026-01","license":"proprietary"},{"id":"anthropic/claude-opus-4-8","name":"claude-opus-4-8","created_by":"anthropic","source":"official","family":"claude-opus","description":"Claude Opus 4.8 is our most intelligent Opus model and the best generally available model for coding and agents, with deeper reasoning for enterprise workflows.","status":"active","context_window":1000000,"model_type":"chat","reasoning_tokens":true,"open_weight":false,"tagline":"Claude Opus 4.8 is our most intelligent Opus model and the best generally available model for coding and agents, with deeper reasoning for enterprise 
workflows.","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"reasoning":true,"vision":true,"streaming":true,"batch":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":5,"output":25},"tools":["function_calling"],"endpoints":["chat_completions"],"last_updated":"2026-06-03","max_output_tokens":128000,"knowledge_cutoff":"2026-01","training_data_cutoff":"2026-01","license":"proprietary"},{"id":"anthropic/claude-sonnet-4-6","name":"claude-sonnet-4-6","created_by":"anthropic","source":"official","family":"claude-sonnet","description":"Claude Sonnet 4.6 delivers frontier intelligence at scale—built for coding, agents, and enterprise workflows.","status":"active","context_window":1000000,"model_type":"chat","reasoning_tokens":true,"open_weight":false,"tagline":"Claude Sonnet 4.6 delivers frontier intelligence at scale—built for coding, agents, and enterprise workflows.","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"reasoning":true,"vision":true,"streaming":true,"batch":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":3,"output":15},"tools":["function_calling"],"endpoints":["chat_completions"],"last_updated":"2026-06-03","max_output_tokens":64000,"knowledge_cutoff":"2025-08","training_data_cutoff":"2026-01","license":"proprietary"},{"id":"BAAI/bge-base-en-v1.5","name":"bge-base-en-v1.5","created_by":"baai","source":"official","last_updated":"2026-04-26","family":"bge","description":"BGE embedding is a general Embedding Model. It is pre-trained using retromae and trained on large-scale pair data using contrastive learning. 
Note that the goal of pre-training is to reconstruct the text, and the pre-trained model cannot be used for similarity calculation directly, it needs to be fine-tuned","status":"active","model_type":"embed","open_weight":true,"license":"mit","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["embeddings"],"tagline":"BGE embedding is a general Embedding Model."},{"id":"BAAI/bge-en-icl","name":"bge-en-icl","created_by":"baai","source":"official","last_updated":"2026-04-26","family":"bge","description":"A LLM-based embedding model with in-context learning capabilities that achieves SOTA performance on BEIR and AIR-Bench. It leverages few-shot examples to enhance task performance.","status":"active","model_type":"embed","open_weight":true,"license":"mit","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["embeddings"],"tagline":"A LLM-based embedding model with in-context learning capabilities that achieves SOTA performance on BEIR and AIR-Bench."},{"id":"BAAI/bge-large-en-v1.5","name":"bge-large-en-v1.5","created_by":"baai","source":"official","last_updated":"2026-04-26","family":"bge","description":"BGE embedding is a general Embedding Model. It is pre-trained using retromae and trained on large-scale pair data using contrastive learning. 
Note that the goal of pre-training is to reconstruct the text, and the pre-trained model cannot be used for similarity calculation directly, it needs to be fine-tuned","status":"active","model_type":"embed","open_weight":true,"license":"mit","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["embeddings"],"tagline":"BGE embedding is a general Embedding Model."},{"id":"BAAI/bge-m3-multi","name":"bge-m3-multi","created_by":"baai","source":"official","last_updated":"2026-04-26","family":"bge","description":"BGE-M3 is a multilingual text embedding model developed by BAAI, distinguished by its Multi-Linguality (supporting 100+ languages), Multi-Functionality (unified dense, multi-vector, and sparse retrieval), and Multi-Granularity (handling inputs from short queries to 8192-token documents). It achieves state-of-the-art retrieval performance across diverse benchmarks while maintaining a single model for multiple retrieval modes.","status":"active","model_type":"embed","open_weight":true,"license":"mit","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["embeddings"],"tagline":"BGE-M3 is a multilingual text embedding model developed by BAAI, distinguished by its Multi-Linguality (supporting 100+ languages), Multi-Functionality (unified dense, multi-vector, and sparse retrieval), and Multi-Granularity (handling inputs from short queries to 8192-token documents)."},{"id":"BAAI/bge-m3","name":"bge-m3","created_by":"baai","source":"official","last_updated":"2026-04-26","family":"bge","description":"BGE-M3 is a versatile text embedding model that supports multi-functionality, multi-linguality, and multi-granularity, allowing it to perform dense retrieval, multi-vector retrieval, and sparse retrieval in over 100 languages and with input sizes up to 8192 tokens. 
The model can be used in a retrieval pipeline with hybrid retrieval and re-ranking to achieve higher accuracy and stronger generalization capabilities. BGE-M3 has shown state-of-the-art performance on several benchmarks, including ...","status":"active","model_type":"embed","open_weight":true,"license":"mit","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["embeddings"],"quantization":"fp32","tagline":"BGE-M3 is a versatile text embedding model that supports multi-functionality, multi-linguality, and multi-granularity, allowing it to perform dense retrieval, multi-vector retrieval, and sparse retrieval in over 100 languages and with input sizes up to 8192 tokens."},{"id":"black-forest-labs/FLUX-1-dev","name":"FLUX-1-dev","created_by":"black-forest-labs","source":"official","last_updated":"2026-04-26","family":"flux","description":"FLUX.1-dev is a state-of-the-art 12 billion parameter rectified flow transformer developed by Black Forest Labs. This model excels in text-to-image generation, providing highly accurate and detailed outputs. It is particularly well-regarded for its ability to follow complex prompts and generate anatomically accurate images, especially with challenging details like hands and faces.","status":"active","model_type":"image","open_weight":true,"license":"flux","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"pricing_notes":["$0.0090 per image unit (1024x1024 default)"],"tagline":"FLUX.1-dev is a state-of-the-art 12 billion parameter rectified flow transformer developed by Black Forest Labs."},{"id":"black-forest-labs/FLUX-1-Redux-dev","name":"FLUX-1-Redux-dev","created_by":"black-forest-labs","source":"official","last_updated":"2026-04-26","family":"flux","description":"FLUX.1 Redux [dev] is an image variation generation adapter for all FLUX.1 base models. 
It enables users to refine images with slight variations and supports text-based restyling via API. Integrated with FLUX1.1 [pro] Ultra, it allows for high-quality 4-megapixel outputs. The model can be used with Diffusers in Python for efficient image generation. While powerful, it has ethical and factual limitations and is governed by a non-commercial license.","status":"active","model_type":"image","open_weight":true,"license":"flux","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"pricing_notes":["$0.0120 per image unit (1024x1024 default)"],"tagline":"FLUX.1 Redux [dev] is an image variation generation adapter for all FLUX.1 base models."},{"id":"black-forest-labs/FLUX-1-schnell","name":"FLUX-1-schnell","created_by":"black-forest-labs","source":"official","last_updated":"2026-04-26","family":"flux","description":"FLUX.1 [schnell] is a 12 billion parameter rectified flow transformer capable of generating images from text descriptions. This model offers cutting-edge output quality and competitive prompt following, matching the performance of closed source alternatives. 
Trained using latent adversarial diffusion distillation, FLUX.1 [schnell] can generate high-quality images in only 1 to 4 steps.","status":"active","model_type":"image","open_weight":true,"license":"flux","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"pricing_notes":["$0.0005 per image unit (1024x1024 default)"],"tagline":"FLUX.1 [schnell] is a 12 billion parameter rectified flow transformer capable of generating images from text descriptions."},{"id":"black-forest-labs/FLUX-1.1-pro","name":"FLUX-1.1-pro","created_by":"black-forest-labs","source":"official","last_updated":"2026-04-26","family":"flux","description":"Black Forest Labs' latest state-of-the art proprietary model sporting top of the line prompt following, visual quality, details and output diversity.","status":"active","model_type":"image","open_weight":false,"license":"flux","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"pricing_notes":["$0.0400 per image unit (0x0 default)"],"tagline":"Black Forest Labs' latest state-of-the art proprietary model sporting top of the line prompt following, visual quality, details and output diversity."},{"id":"black-forest-labs/FLUX-2-dev","name":"FLUX-2-dev","created_by":"black-forest-labs","source":"official","last_updated":"2026-04-26","family":"flux-2","description":"Brand-new Flux2 Dev introduces a faster, more modular architecture for next-generation image generation pipelines. 
It delivers improved performance, cleaner control APIs, and a significantly more flexible development workflow for custom inference setups.","status":"active","model_type":"image","open_weight":true,"license":"flux","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"pricing_notes":["$0.0100 per image unit (1024x1024 default)"],"tagline":"Brand-new Flux2 Dev introduces a faster, more modular architecture for next-generation image generation pipelines."},{"id":"black-forest-labs/FLUX-2-klein-4b","name":"FLUX-2-klein-4b","created_by":"black-forest-labs","source":"official","last_updated":"2026-04-26","family":"flux-2","description":"The fastest model of the Flux 2 family. Frontier visual intelligence — state-of-the-art image generation and editing from Black Forest Labs","status":"active","model_type":"image","open_weight":true,"license":"flux","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"pricing_notes":["$0.0140 per image unit (1024x1024 default)"],"tagline":"The fastest model of the Flux 2 family."},{"id":"black-forest-labs/FLUX-2-klein-9b","name":"FLUX-2-klein-9b","created_by":"black-forest-labs","source":"official","last_updated":"2026-04-26","family":"flux-2","description":"The best quality-to-latency ratio, production apps model of the Flux 2 family. 
Frontier visual intelligence — state-of-the-art image generation and editing from Black Forest Labs","status":"active","model_type":"image","open_weight":true,"license":"flux","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"pricing_notes":["$0.0150 per image unit (1024x1024 default)"],"tagline":"The best quality-to-latency ratio, production apps model of the Flux 2 family."},{"id":"black-forest-labs/FLUX-2-max","name":"FLUX-2-max","created_by":"black-forest-labs","source":"official","last_updated":"2026-04-26","family":"flux-2","description":"The new top-tier image model from Black Forest Labs, significantly pushing image quality and editing consistency","status":"active","model_type":"image","open_weight":false,"license":"flux","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"pricing_notes":["$0.1000 per image unit (0x0 default)"],"tagline":"The new top-tier image model from Black Forest Labs, significantly pushing image quality and editing consistency"},{"id":"black-forest-labs/FLUX-2-pro","name":"FLUX-2-pro","created_by":"black-forest-labs","source":"official","last_updated":"2026-04-26","family":"flux-2","description":"Multi-reference visual intelligence with unprecedented detail, color precision, and spatial reasoning. The most advanced image generation and editing model. 
Generate photorealistic images with precise control.","status":"active","model_type":"image","open_weight":false,"license":"flux","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"pricing_notes":["$0.0150 per image unit (0x0 default)"],"tagline":"Multi-reference visual intelligence with unprecedented detail, color precision, and spatial reasoning."},{"id":"black-forest-labs/FLUX-pro","name":"FLUX-pro","created_by":"black-forest-labs","source":"official","last_updated":"2026-04-26","family":"flux","description":"Black Forest Labs' first flagship model based on Flux latent rectified flow transformers","status":"active","model_type":"image","open_weight":false,"license":"flux","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"pricing_notes":["$0.0500 per image unit (0x0 default)"],"tagline":"Black Forest Labs' first flagship model based on Flux latent rectified flow transformers"},{"id":"black-forest-labs/FLUX.1-Kontext-dev","name":"FLUX.1-Kontext-dev","created_by":"black-forest-labs","source":"official","last_updated":"2026-04-26","family":"flux","description":"FLUX.1 Kontext [dev] is a 12-billion-parameter image editing model that transforms visuals based on natural language instructions. 
It allows highly consistent, multi-step edits and is released with open weights under a non-commercial license to empower artists and researchers.","status":"active","model_type":"image","open_weight":true,"license":"flux","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"pricing_notes":["$0.0100 per image unit (1024x1024 default)"],"tagline":"FLUX.1 Kontext [dev] is a 12-billion-parameter image editing model that transforms visuals based on natural language instructions."},{"id":"bosonai/HiggsAudioV2.5","name":"HiggsAudioV2.5","created_by":"bosonai","source":"official","last_updated":"2026-04-26","family":"bosonai","description":"HiggsAudioV2.5 is a high-quality neural text-to-speech (TTS) model designed for natural-sounding voice generation across a wide range of use cases. It focuses on clarity, stable prosody, and consistent pacing, making it suitable for both short prompts and longer narration.","status":"active","model_type":"tts","open_weight":true,"capabilities":{"streaming":true},"modalities":{"input":["text"],"output":["audio"]},"endpoints":["audio_speech"],"pricing_notes":["$20.0000 per 1M input characters"],"tagline":"HiggsAudioV2.5 is a high-quality neural text-to-speech (TTS) model designed for natural-sounding voice generation across a wide range of use cases."},{"id":"Bria/blur_background","name":"blur_background","created_by":"bria","source":"official","last_updated":"2026-04-26","family":"bria","description":"Bria Blur Background softens and de-emphasizes image backgrounds while keeping the subject sharp and clear for professional-quality results. 
Trained fully on licensed data, it delivers safe, natural, and commercial-ready outputs.","status":"active","model_type":"image","open_weight":false,"capabilities":{"streaming":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"pricing_notes":["$0.0400 per image unit (0x0 default)"],"tagline":"Bria Blur Background softens and de-emphasizes image backgrounds while keeping the subject sharp and clear for professional-quality results."},{"id":"Bria/Bria-3.2-vector","name":"Bria-3.2-vector","created_by":"bria","source":"official","last_updated":"2026-04-26","family":"bria","description":"Bria 3.2 is the next-generation commercial-ready text-to-image model. With just 4 billion parameters, it provides exceptional aesthetics and text rendering, evaluated to be on par to leading open-source models, and outperforming other licensed models.","status":"active","model_type":"image","open_weight":false,"capabilities":{"streaming":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"pricing_notes":["$0.0400 per image unit (0x0 default)"],"tagline":"Bria 3.2 is the next-generation commercial-ready text-to-image model."},{"id":"Bria/Bria-3.2","name":"Bria-3.2","created_by":"bria","source":"official","last_updated":"2026-04-26","family":"bria","description":"Bria 3.2 is the next-generation commercial-ready text-to-image model. 
With just 4 billion parameters, it provides exceptional aesthetics and text rendering, evaluated to be on par to leading open-source models, and outperforming other licensed models.","status":"active","model_type":"image","open_weight":false,"capabilities":{"streaming":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"pricing_notes":["$0.0400 per image unit (0x0 default)"],"tagline":"Bria 3.2 is the next-generation commercial-ready text-to-image model."},{"id":"Bria/enhance","name":"enhance","created_by":"bria","source":"official","last_updated":"2026-04-26","family":"bria","description":"Bria Enhance improves overall image quality by sharpening details, balancing colors, and boosting clarity for crisp, professional visuals. Trained only on licensed data, it’s safe, reliable, and ready for commercial use.","status":"active","model_type":"image","open_weight":false,"capabilities":{"streaming":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"pricing_notes":["$0.0400 per image unit (0x0 default)"],"tagline":"Bria Enhance improves overall image quality by sharpening details, balancing colors, and boosting clarity for crisp, professional visuals."},{"id":"Bria/erase","name":"erase","created_by":"bria","source":"official","last_updated":"2026-04-26","family":"bria","description":"Bria Eraser enables precise removal of unwanted objects from images while maintaining high-quality outputs. 
Trained exclusively on licensed data for safe and risk-free commercial use","status":"active","model_type":"image","open_weight":false,"capabilities":{"streaming":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"pricing_notes":["$0.0400 per image unit (0x0 default)"],"tagline":"Bria Eraser enables precise removal of unwanted objects from images while maintaining high-quality outputs."},{"id":"Bria/erase_foreground","name":"erase_foreground","created_by":"bria","source":"official","last_updated":"2026-04-26","family":"bria","description":"Bria Erase Foreground precisely removes main subjects or foreground objects from images. Built entirely on licensed data, it is safe and optimized for professional and commercial use.","status":"active","model_type":"image","open_weight":false,"capabilities":{"streaming":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"pricing_notes":["$0.0400 per image unit (0x0 default)"],"tagline":"Bria Erase Foreground precisely removes main subjects or foreground objects from images."},{"id":"Bria/expand","name":"expand","created_by":"bria","source":"official","last_updated":"2026-04-26","family":"bria","description":"Bria Expand expands images beyond their borders in high quality. Resizing the image by generating new pixels to expand to the desired aspect ratio. 
Trained exclusively on licensed data for safe and risk-free commercial use.","status":"active","model_type":"image","open_weight":false,"capabilities":{"streaming":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"pricing_notes":["$0.0400 per image unit (0x0 default)"],"tagline":"Bria Expand expands images beyond their borders in high quality."},{"id":"Bria/fibo","name":"fibo","created_by":"bria","source":"official","last_updated":"2026-04-26","family":"bria","description":"FIBO is an open-source, JSON-native text-to-image model trained on detailed structured descriptions (over 1,000+ words per image), providing fine-grained control over light, composition, and camera parameters.","status":"active","model_type":"image","open_weight":false,"capabilities":{"streaming":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"pricing_notes":["$0.0400 per image unit (0x0 default)"],"tagline":"FIBO is an open-source, JSON-native text-to-image model trained on detailed structured descriptions (over 1,000+ words per image), providing fine-grained control over light, composition, and camera pa"},{"id":"Bria/fibo_edit","name":"fibo_edit","created_by":"bria","source":"official","last_updated":"2026-04-26","family":"bria","description":"🥳 For a limited time, Fibo Edit is free on DeepInfra 🥳 YOUR AI, YOUR RULES. Visual Generation for Production-Grade. FIBO Edit. 
An open-source image editing model with native masking and a lightweight 8B architecture.","status":"active","model_type":"image","open_weight":false,"capabilities":{"streaming":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"pricing_notes":["$0.0400 per image unit (0x0 default)"],"tagline":"🥳 For a limited time, Fibo Edit is free on DeepInfra 🥳 YOUR AI, YOUR RULES."},{"id":"Bria/gen_fill","name":"gen_fill","created_by":"bria","source":"official","last_updated":"2026-04-26","family":"bria","description":"Bria GenFill enables high-quality object addition or visual transformation. Trained exclusively on licensed data for safe and risk-free commercial use.","status":"active","model_type":"image","open_weight":false,"capabilities":{"streaming":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"pricing_notes":["$0.0400 per image unit (0x0 default)"],"tagline":"Bria GenFill enables high-quality object addition or visual transformation."},{"id":"Bria/remove_background","name":"remove_background","created_by":"bria","source":"official","last_updated":"2026-04-26","family":"bria","description":"Bria RMBG 2.0 enables seamless removal of backgrounds from images, ideal for professional editing tasks. 
Trained exclusively on licensed data for safe and risk-free commercial use.","status":"active","model_type":"image","open_weight":false,"capabilities":{"streaming":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"pricing_notes":["$0.0180 per image unit (0x0 default)"],"tagline":"Bria RMBG 2.0 enables seamless removal of backgrounds from images, ideal for professional editing tasks."},{"id":"Bria/replace_background","name":"replace_background","created_by":"bria","source":"official","last_updated":"2026-04-26","family":"bria","description":"Bria Background Generation allows for efficient swapping of backgrounds in images via text prompts or reference image, delivering realistic and polished results. Trained exclusively on licensed data for safe and risk-free commercial use.","status":"active","model_type":"image","open_weight":false,"capabilities":{"streaming":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"pricing_notes":["$0.0400 per image unit (0x0 default)"],"tagline":"Bria Background Generation allows for efficient swapping of backgrounds in images via text prompts or reference image, delivering realistic and polished results."},{"id":"Bria/video_eraser","name":"video_eraser","created_by":"bria","source":"official","last_updated":"2026-04-26","family":"bria","description":"Remove unwanted objects or regions from video using a mask, reconstructs the background with intelligent content-aware fill.","status":"active","model_type":"video","open_weight":false,"modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"tagline":"Remove unwanted objects or regions from video using a mask, reconstructs the background with intelligent content-aware fill."},{"id":"Bria/video_foreground_mask","name":"video_foreground_mask","created_by":"bria","source":"official","last_updated":"2026-04-26","family":"bria","description":"Automatically identify and segment foreground objects across video frames 
and generate a mask. No prompts, just a video.","status":"active","model_type":"video","open_weight":false,"modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"tagline":"Automatically identify and segment foreground objects across video frames and generate a mask."},{"id":"Bria/video_increase_resolution","name":"video_increase_resolution","created_by":"bria","source":"official","last_updated":"2026-04-26","family":"bria","description":"Increase video resolution up to 8K with advanced AI upscaling. Bring your videos to the big screen, ready for the screens of tomorrow.","status":"active","model_type":"video","open_weight":false,"modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"tagline":"Increase video resolution up to 8K with advanced AI upscaling."},{"id":"Bria/video_mask_by_key_points","name":"video_mask_by_key_points","created_by":"bria","source":"official","last_updated":"2026-04-26","family":"bria","description":"Identify and segment objects across video frames using specific coordinate points. Just point in the right direction and the model will figure out by itself which object should be masked.","status":"active","model_type":"video","open_weight":false,"modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"tagline":"Identify and segment objects across video frames using specific coordinate points."},{"id":"Bria/video_mask_by_prompt","name":"video_mask_by_prompt","created_by":"bria","source":"official","last_updated":"2026-04-26","family":"bria","description":"Identify and segment objects across video frames using a text prompt. 
The easiest way to create a mask to modify your videos.","status":"active","model_type":"video","open_weight":false,"modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"tagline":"Identify and segment objects across video frames using a text prompt."},{"id":"Bria/video_remove_background","name":"video_remove_background","created_by":"bria","source":"official","last_updated":"2026-04-26","family":"bria","description":"Light and fast. Remove the background of your videos to bring the foreground elements to focus. No more unwanted distractions.","status":"active","model_type":"video","open_weight":false,"modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"tagline":"Light and fast."},{"id":"ByteDance/Seed-1.8","name":"Seed-1.8","created_by":"bytedance","source":"official","last_updated":"2026-04-26","family":"bytedance","description":"Optimized specifically for multimodal agent scenarios. It features enhanced agent capabilities, upgraded multimodal comprehension, and more flexible context management.","status":"active","model_type":"chat","context_window":256000,"reasoning_tokens":true,"open_weight":false,"license":"apache-2.0","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"reasoning":true,"vision":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":0.25,"output":2,"cached_input":0.05},"tools":["function_calling"],"endpoints":["chat_completions"],"tagline":"Optimized specifically for multimodal agent scenarios."},{"id":"ByteDance/Seed-2.0-code","name":"Seed-2.0-code","created_by":"bytedance","source":"official","description":"A coding model optimized for real-world development environments, with reliable tool use in common IDEs such as Claude Code. 
It delivers strong front-end performance and supports Skills.","status":"active","context_window":256000,"model_type":"chat","reasoning_tokens":true,"license":"apache-2.0","open_weight":false,"tagline":"A coding model optimized for real-world development environments, with reliable tool use in common IDEs such as Claude Code.","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"reasoning":true,"vision":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":0.5,"output":3,"cached_input":0.1},"tools":["function_calling"],"endpoints":["chat_completions"],"last_updated":"2026-06-03"},{"id":"ByteDance/Seed-2.0-mini","name":"Seed-2.0-mini","created_by":"bytedance","source":"official","last_updated":"2026-04-26","family":"seed","description":"Built for low-latency, high-concurrency, cost-sensitive use cases, with flexible deployment, four-tier thinking, and multimodal","status":"active","model_type":"chat","context_window":256000,"reasoning_tokens":true,"open_weight":false,"license":"apache-2.0","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"reasoning":true,"vision":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":0.1,"output":0.4,"cached_input":0.02},"tools":["function_calling"],"endpoints":["chat_completions"],"tagline":"Built for low-latency, high-concurrency, cost-sensitive use cases, with flexible deployment, four-tier thinking, and multimodal"},{"id":"ByteDance/Seed-2.0-pro","name":"Seed-2.0-pro","created_by":"bytedance","source":"official","last_updated":"2026-04-26","family":"seed","description":"Built for the Agent era, it delivers stable performance in complex reasoning and long-horizon tasks, including multi-step planning, visual-text reasoning, video understanding, and advanced 
analysis.","status":"active","model_type":"chat","context_window":256000,"reasoning_tokens":true,"open_weight":false,"license":"apache-2.0","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"reasoning":true,"vision":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":0.5,"output":3,"cached_input":0.1},"tools":["function_calling"],"endpoints":["chat_completions"],"tagline":"Built for the Agent era, it delivers stable performance in complex reasoning and long-horizon tasks, including multi-step planning, visual-text reasoning, video understanding, and advanced analysis."},{"id":"ByteDance/Seedance-1.5-Pro","name":"Seedance-1.5-Pro","created_by":"bytedance","source":"official","last_updated":"2026-04-26","family":"bytedance","description":"ByteDance's Seedance 1.5 Pro is a professional video model using V2A native generation for integrated, synced audio-visual output, enhancing efficiency of professional video creation.","status":"active","model_type":"video","open_weight":false,"license":"apache-2.0","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"tagline":"ByteDance's Seedance 1.5 Pro is a professional video model using V2A native generation for integrated, synced audio-visual output, enhancing efficiency of professional video creation."},{"id":"ByteDance/Seedance-2.0","name":"Seedance-2.0","created_by":"bytedance","source":"official","description":"A new-generation professional-grade multimodal video creation model developed, supports video generation with multimodal reference inputs including images, videos and audio.","status":"active","model_type":"video","license":"apache-2.0","open_weight":false,"tagline":"A new-generation professional-grade multimodal video creation model developed, supports video generation with multimodal reference inputs including images, videos and 
audio.","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_updated":"2026-06-03","capabilities":{"vision":true,"fine_tuning":true}},{"id":"ByteDance/Seedream-4.5","name":"Seedream-4.5","created_by":"bytedance","source":"official","last_updated":"2026-04-26","family":"bytedance","description":"The latest image model, delivering better editing consistency, improved multi-image fusion, finer detail control, natural small text and faces, and harmonious, aesthetic visuals.","status":"active","model_type":"image","open_weight":false,"license":"apache-2.0","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"pricing_notes":["$0.0400 per image unit (0x0 default)"],"tagline":"The latest image model, delivering better editing consistency, improved multi-image fusion, finer detail control, natural small text and faces, and harmonious, aesthetic visuals."},{"id":"ByteDance/Seedream-4","name":"Seedream-4","created_by":"bytedance","source":"official","last_updated":"2026-04-26","family":"bytedance","description":"Seedream 4.0 is a SOTA multimodal image creation model built on leading architecture. It breaks through the boundaries of traditional text-to-image models by natively supporting text, single-image, and multi-image inputs. 
Users can freely combine text and images to achieve diverse creative modes within a single model—such as multi-image blending, image editing, and sequentially batch image generation, featuring subject consistency, making image creation more free and controllable.","status":"active","model_type":"image","open_weight":false,"license":"apache-2.0","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"pricing_notes":["$0.0400 per image unit (0x0 default)"],"tagline":"Seedream 4.0 is a SOTA multimodal image creation model built on leading architecture."},{"id":"canopylabs/orpheus-3b-0.1-ft","name":"orpheus-3b-0.1-ft","created_by":"canopylabs","source":"official","last_updated":"2026-04-26","family":"canopylabs","description":"Orpheus TTS is a state-of-the-art, Llama-based Speech-LLM designed for high-quality, empathetic text-to-speech generation. This model has been finetuned to deliver human-level speech synthesis, achieving exceptional clarity, expressiveness, and real-time streaming performances.","status":"active","model_type":"tts","open_weight":true,"capabilities":{"streaming":true},"modalities":{"input":["text"],"output":["audio"]},"endpoints":["audio_speech"],"pricing_notes":["$7.0000 per 1M input characters"],"tagline":"Orpheus TTS is a state-of-the-art, Llama-based Speech-LLM designed for high-quality, empathetic text-to-speech generation."},{"id":"ClarityAI/creative","name":"creative","created_by":"clarityai","source":"official","last_updated":"2026-04-26","family":"clarityai","description":"ClarityAI/creative is an AI-powered image upscaler that enhances details, adds realism, and creatively modifies images to improve their quality and visual appeal.","status":"active","model_type":"image","open_weight":false,"capabilities":{"streaming":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"pricing_notes":["$0.0500 per image unit (0x0 
default)"],"tagline":"ClarityAI/creative is an AI-powered image upscaler that enhances details, adds realism, and creatively modifies images to improve their quality and visual appeal."},{"id":"ClarityAI/crystal","name":"crystal","created_by":"clarityai","source":"official","last_updated":"2026-04-26","family":"clarityai","description":"ClarityAI/crystal is a specialized upscaler optimized for portraits, faces, and products, delivering high-precision enhancements with adjustable detail levels for sharp, natural results.","status":"active","model_type":"image","open_weight":false,"capabilities":{"streaming":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"pricing_notes":["$0.0500 per image unit (0x0 default)"],"tagline":"ClarityAI/crystal is a specialized upscaler optimized for portraits, faces, and products, delivering high-precision enhancements with adjustable detail levels for sharp, natural results."},{"id":"ClarityAI/flux","name":"flux","created_by":"clarityai","source":"official","last_updated":"2026-04-26","family":"flux","description":"ClarityAI/flux integrates the Flux AI model into the upscaling process, enabling high-resolution enhancements with superior face preservation and support for LoRAs to apply specific styles or identities.","status":"active","model_type":"image","open_weight":false,"capabilities":{"streaming":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"pricing_notes":["$0.2000 per image unit (0x0 default)"],"tagline":"ClarityAI/flux integrates the Flux AI model into the upscaling process, enabling high-resolution enhancements with superior face preservation and support for LoRAs to apply specific styles or 
identiti"},{"id":"deepreinforce-ai/Ornith-1.0-35B","name":"Ornith-1.0-35B","created_by":"deepreinforce-ai","source":"official","status":"active","context_window":262144,"model_type":"chat","reasoning_tokens":true,"open_weight":true,"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"reasoning":true,"vision":true,"streaming":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":0.14,"output":1,"cached_input":0.05},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"fp8","last_updated":"2026-06-30","description":"Ornith-1.0-35B is DeepReinforce's open (MIT-licensed) agentic-coding model: an RL post-train of Qwen3.5-35B-A3B, a 35B-total / ~3B-active Mixture-of-Experts with hybrid Gated-DeltaNet attention. It targets state-of-the-art open-model coding-agent performance (SWE-bench Verified 75.6, Terminal-Bench 2.1 64.2) with a 262K-token context, thinking/reasoning mode, tool calling, and image + video understanding.","tagline":"Ornith-1.0-35B is DeepReinforce's open (MIT-licensed) agentic-coding model: an RL post-train of Qwen3.5-35B-A3B, a 35B-total / ~3B-active Mixture-of-Experts with hybrid Gated-DeltaNet attention."},{"id":"deepseek-ai/DeepSeek-R1-0528-Turbo","name":"DeepSeek-R1-0528-Turbo","created_by":"deepseek","source":"official","last_updated":"2026-04-26","family":"deepseek-r1","description":"The DeepSeek R1 0528 turbo model is a state of the art reasoning model that can generate very quick responses","status":"active","model_type":"chat","context_window":32768,"open_weight":true,"license":"deepseek","capabilities":{"tool_call":true,"json_mode":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":1,"output":3},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"fp4","tagline":"The DeepSeek R1 0528 turbo model is a state of the art reasoning model that can generate very quick 
responses"},{"id":"deepseek-ai/DeepSeek-R1-0528","name":"DeepSeek-R1-0528","created_by":"deepseek","source":"official","last_updated":"2026-04-26","family":"deepseek-r1","description":"The DeepSeek R1 model has undergone a minor version upgrade, with the current version being DeepSeek-R1-0528.","status":"active","model_type":"chat","context_window":163840,"open_weight":true,"license":"deepseek","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.5,"output":2.15,"cached_input":0.35},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"fp4","tagline":"The DeepSeek R1 model has undergone a minor version upgrade, with the current version being DeepSeek-R1-0528."},{"id":"deepseek-ai/DeepSeek-R1-Distill-Llama-70B","name":"DeepSeek-R1-Distill-Llama-70B","created_by":"deepseek","source":"official","last_updated":"2026-04-26","family":"llama","description":"DeepSeek-R1-Distill-Llama-70B is a highly efficient language model that leverages knowledge distillation to achieve state-of-the-art performance. This model distills the reasoning patterns of larger models into a smaller, more agile architecture, resulting in exceptional results on benchmarks like AIME 2024, MATH-500, and LiveCodeBench. 
With 70 billion parameters, DeepSeek-R1-Distill-Llama-70B offers a unique balance of accuracy and efficiency, making it an ideal choice for a wide range of na...","status":"active","model_type":"chat","context_window":131072,"open_weight":true,"license":"deepseek","capabilities":{"json_mode":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.7,"output":0.8},"endpoints":["chat_completions"],"quantization":"fp8","tagline":"DeepSeek-R1-Distill-Llama-70B is a highly efficient language model that leverages knowledge distillation to achieve state-of-the-art performance."},{"id":"deepseek-ai/DeepSeek-V3-0324","name":"DeepSeek-V3-0324","created_by":"deepseek","source":"official","last_updated":"2026-04-26","family":"deepseek-v3","description":"DeepSeek-V3-0324, a strong Mixture-of-Experts (MoE) language model with 671B total parameters with 37B activated for each token, an improved iteration over DeepSeek-V3.","status":"active","model_type":"chat","context_window":163840,"open_weight":true,"license":"deepseek","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.2,"output":0.77,"cached_input":0.135},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"fp4","tagline":"DeepSeek-V3-0324, a strong Mixture-of-Experts (MoE) language model with 671B total parameters with 37B activated for each token, an improved iteration over DeepSeek-V3."},{"id":"deepseek-ai/DeepSeek-V3.1-Terminus","name":"DeepSeek-V3.1-Terminus","created_by":"deepseek","source":"official","last_updated":"2026-06-03","family":"deepseek-v3","description":"DeepSeek-V3.1 Terminus is an update to DeepSeek V3.1 that maintains the model's original capabilities while addressing issues reported by users, including language consistency and agent capabilities, further optimizing the model's performance in 
coding and search agents. It is a large hybrid reasoning model (671B parameters, 37B active) that supports both thinking and non-thinking modes. It extends the DeepSeek-V3 base with a two-phase long-context training process. Users can control the reas...","status":"active","model_type":"chat","context_window":163840,"open_weight":true,"license":"deepseek","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.27,"output":0.95,"cached_input":0.13},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"fp4","tagline":"DeepSeek-V3.1 Terminus is an update to DeepSeek V3.1 that maintains the model's original capabilities while addressing issues reported by users, including language consistency and agent capabilities, further optimizing the model's performance in coding and search agents."},{"id":"deepseek-ai/DeepSeek-V3.1","name":"DeepSeek-V3.1","created_by":"deepseek","source":"official","last_updated":"2026-04-26","family":"deepseek-v3","description":"DeepSeek-V3.1 is post-trained on the top of DeepSeek-V3.1-Base, which is built upon the original V3 base checkpoint through a two-phase long context extension approach, following the methodology outlined in the original DeepSeek-V3 report. We have expanded our dataset by collecting additional long documents and substantially extending both training phases. 
The 32K extension phase has been increased 10-fold to 630B tokens, while the 128K extension phase has been extended by 3.3x to 209B tokens...","status":"active","model_type":"chat","context_window":163840,"open_weight":true,"license":"deepseek","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.21,"output":0.79,"cached_input":0.13},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"fp4","tagline":"DeepSeek-V3.1 is post-trained on the top of DeepSeek-V3.1-Base, which is built upon the original V3 base checkpoint through a two-phase long context extension approach, following the methodology outlined in the original DeepSeek-V3 report."},{"id":"deepseek-ai/DeepSeek-V3.2","name":"DeepSeek-V3.2","created_by":"deepseek","source":"official","last_updated":"2026-04-26","family":"deepseek-v3","description":"DeepSeek-V3.2 is a large language model designed to harmonize high computational efficiency with strong reasoning and agentic tool-use performance. It introduces DeepSeek Sparse Attention (DSA), a fine-grained sparse attention mechanism that reduces training and inference cost while preserving quality in long-context scenarios. 
A scalable reinforcement learning post-training framework further improves reasoning, with reported performance in the GPT-5 class, and the model has demonstrated gold...","status":"active","model_type":"chat","context_window":163840,"open_weight":true,"license":"deepseek","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.26,"output":0.38,"cached_input":0.13},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"fp4","tagline":"DeepSeek-V3.2 is a large language model designed to harmonize high computational efficiency with strong reasoning and agentic tool-use performance."},{"id":"deepseek-ai/DeepSeek-V3","name":"DeepSeek-V3","created_by":"deepseek","source":"official","last_updated":"2026-04-26","family":"deepseek-v3","description":"DeepSeek-V3, a strong Mixture-of-Experts (MoE) language model with 671B total parameters with 37B activated for each token. 
To achieve efficient inference and cost-effective training, DeepSeek-V3 adopts Multi-head Latent Attention (MLA) and DeepSeekMoE architectures, which were thoroughly validated in DeepSeek-V2.","status":"active","model_type":"chat","context_window":163840,"open_weight":true,"license":"deepseek","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.32,"output":0.89},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"fp4","tagline":"DeepSeek-V3, a strong Mixture-of-Experts (MoE) language model with 671B total parameters with 37B activated for each token."},{"id":"deepseek-ai/DeepSeek-V4-Flash","name":"DeepSeek-V4-Flash","created_by":"deepseek","source":"official","last_updated":"2026-06-03","family":"deepseek-v4","description":"DeepSeek V4 Flash is an efficiency-focused MoE model with 284B total parameters (13B active) and a 1M-token context window. 
It's tuned for fast inference and high-throughput use cases while still holding up on reasoning and coding tasks.","status":"active","model_type":"chat","context_window":1048576,"open_weight":true,"license":"deepseek","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"fine_tuning":true,"reasoning":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.1,"output":0.2,"cached_input":0.02},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"fp4","tagline":"DeepSeek V4 Flash is an efficiency-focused MoE model with 284B total parameters (13B active) and a 1M-token context window.","reasoning_tokens":true,"max_output_tokens":384000},{"id":"deepseek-ai/DeepSeek-V4-Pro","name":"DeepSeek-V4-Pro","created_by":"deepseek","source":"official","last_updated":"2026-06-03","family":"deepseek-v4","description":"DeepSeek V4 Pro is an MoE model with 1.6T total parameters (49B active) and a 1M-token context window. It's built for advanced reasoning, coding, and long-running agent tasks, and performs well on knowledge, math, and software engineering benchmarks.","status":"active","model_type":"chat","context_window":1048576,"open_weight":true,"license":"deepseek","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"fine_tuning":true,"reasoning":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":1.3,"output":2.6,"cached_input":0.1},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"fp4","tagline":"DeepSeek V4 Pro is an MoE model with 1.6T total parameters (49B active) and a 1M-token context window.","max_output_tokens":384000},{"id":"deepseek-ai/Janus-Pro-1B","name":"Janus-Pro-1B","created_by":"deepseek","source":"official","last_updated":"2026-04-26","family":"deepseek-ai","description":"Janus-Pro is a novel autoregressive framework that unifies multimodal understanding and generation. 
It addresses the limitations of previous approaches by decoupling visual encoding into separate pathways, while still utilizing a single, unified transformer architecture for processing. The decoupling not only alleviates the conflict between the visual encoder’s roles in understanding and generation, but also enhances the framework’s flexibility. Janus-Pro surpasses previous unified model and ...","status":"active","model_type":"image","open_weight":true,"license":"deepseek","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"pricing_notes":["$0.0005 per image unit (0x0 default)"],"tagline":"Janus-Pro is a novel autoregressive framework that unifies multimodal understanding and generation."},{"id":"deepseek-ai/Janus-Pro-7B","name":"Janus-Pro-7B","created_by":"deepseek","source":"official","last_updated":"2026-04-26","family":"deepseek-ai","description":"Janus-Pro is a novel autoregressive framework that unifies multimodal understanding and generation. It addresses the limitations of previous approaches by decoupling visual encoding into separate pathways, while still utilizing a single, unified transformer architecture for processing. The decoupling not only alleviates the conflict between the visual encoder’s roles in understanding and generation, but also enhances the framework’s flexibility. 
Janus-Pro surpasses previous unified model and ...","status":"active","model_type":"image","open_weight":true,"license":"deepseek","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"pricing_notes":["$0.0020 per image unit (0x0 default)"],"tagline":"Janus-Pro is a novel autoregressive framework that unifies multimodal understanding and generation."},{"id":"FastVideo/LTX-2.3-Distilled-Diffusers","name":"LTX-2.3-Distilled-Diffusers","created_by":"fastvideo","source":"official","description":"A fast, step-distilled build of Lightricks' LTX-2.3 diffusion-transformer video model (distilled by FastVideo). Generates high-fidelity text-to-video and image-to-video in just a few denoising steps.","status":"active","model_type":"video","open_weight":true,"tagline":"A fast, step-distilled build of Lightricks' LTX-2.3 diffusion-transformer video model (distilled by FastVideo).","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_updated":"2026-06-29"},{"id":"FastVideo/LTX2-Distilled-Diffusers","name":"LTX2-Distilled-Diffusers","created_by":"fastvideo","source":"official","description":"LTX-2 is a DiT-based audio-video foundation model designed to generate synchronized video and audio within a single model. 
It brings together the core building blocks of modern video generation, with open weights and a focus on practical, local execution.","status":"active","model_type":"video","open_weight":true,"tagline":"LTX-2 is a DiT-based audio-video foundation model designed to generate synchronized video and audio within a single model.","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_updated":"2026-06-03"},{"id":"google/embeddinggemma-300m","name":"embeddinggemma-300m","created_by":"google","source":"official","last_updated":"2026-06-29","family":"embed","description":"EmbeddingGemma is a 300M parameter multilingual open embedding model from Google DeepMind, designed for efficient deployment even on low-resource devices, producing high-quality text vector representations for tasks such as search, classification, clustering, and semantic similarity.","status":"active","model_type":"embed","open_weight":true,"license":"gemma","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["embeddings"],"tagline":"EmbeddingGemma is a 300M parameter multilingual open embedding model from Google DeepMind, designed for efficient deployment even on low-resource devices, producing high-quality text vector representations for tasks such as search, classification, clustering, and semantic similarity."},{"id":"google/gemini-2.5-flash","name":"gemini-2.5-flash","created_by":"google","source":"official","last_updated":"2026-04-26","family":"gemini-2.5","description":"Gemini 2.5 Flash is Google's latest thinking model, designed to tackle increasingly complex problems. It's capable of reasoning through their thoughts before responding, resulting in enhanced performance and improved accuracy. 
Gemini 2.5 Flash: best for balancing reasoning and speed.","status":"active","model_type":"chat","context_window":1000000,"reasoning_tokens":true,"open_weight":false,"license":"gemma","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"reasoning":true,"vision":true,"streaming":true,"fine_tuning":true,"batch":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":0.3,"output":2.5},"tools":["function_calling"],"endpoints":["chat_completions"],"tagline":"Gemini 2.5 Flash is Google's latest thinking model, designed to tackle increasingly complex problems.","max_output_tokens":65536,"knowledge_cutoff":"2025-01"},{"id":"google/gemini-2.5-pro","name":"gemini-2.5-pro","created_by":"google","source":"official","last_updated":"2026-04-26","family":"gemini-2.5","description":"Gemini 2.5 Pro is Google's most advanced thinking model, designed to tackle increasingly complex problems. Gemini 2.5 Pro leads common benchmarks by meaningful margins and showcases strong reasoning and code capabilities. Gemini 2.5 models are thinking models, capable of reasoning through their thoughts before responding, resulting in enhanced performance and improved accuracy. 
The Gemini 2.5 Pro model is now available on DeepInfra.","status":"active","model_type":"chat","context_window":1000000,"reasoning_tokens":true,"open_weight":false,"license":"gemma","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"reasoning":true,"vision":true,"streaming":true,"fine_tuning":true,"batch":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":1.25,"output":10},"tools":["function_calling"],"endpoints":["chat_completions"],"tagline":"Gemini 2.5 Pro is Google's most advanced thinking model, designed to tackle increasingly complex problems.","max_output_tokens":65536,"knowledge_cutoff":"2025-01"},{"id":"google/gemini-3-pro-image","name":"gemini-3-pro-image","created_by":"google","source":"official","family":"gemini-3","description":"Nano Banana Pro (Gemini 3 Pro Image) is designed to tackle the most challenging image generation by incorporating state-of-the-art reasoning capabilities. It is the best model for complex and multi-turn image generation and editing.","status":"active","model_type":"image","license":"gemma","open_weight":false,"tagline":"Nano Banana Pro (Gemini 3 Pro Image) is designed to tackle the most challenging image generation by incorporating state-of-the-art reasoning capabilities.","capabilities":{"streaming":true,"fine_tuning":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_updated":"2026-06-03","context_window":65536,"max_output_tokens":32768,"knowledge_cutoff":"2025-01"},{"id":"google/gemini-3.1-flash-lite","name":"gemini-3.1-flash-lite","created_by":"google","source":"official","family":"gemini-3.1","description":"Bring any idea to life with state-of-the-art reasoning to help you learn, build, and plan anything. 
Best for high-volume tasks that need efficiency and intelligence.","status":"active","context_window":1000000,"model_type":"chat","reasoning_tokens":true,"license":"gemma","open_weight":false,"tagline":"Bring any idea to life with state-of-the-art reasoning to help you learn, build, and plan anything.","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"reasoning":true,"vision":true,"streaming":true,"fine_tuning":true,"batch":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":0.25,"output":1.5},"tools":["function_calling"],"endpoints":["chat_completions"],"last_updated":"2026-06-03","max_output_tokens":65536,"knowledge_cutoff":"2025-01"},{"id":"google/gemini-3.1-pro","name":"gemini-3.1-pro","created_by":"google","source":"official","family":"gemini-3.1","description":"Bring any idea to life with state-of-the-art reasoning to help you learn, build, and plan anything. Best for complex tasks and bringing creative concepts to life.","status":"active","context_window":1000000,"model_type":"chat","reasoning_tokens":true,"license":"gemma","open_weight":false,"tagline":"Bring any idea to life with state-of-the-art reasoning to help you learn, build, and plan anything.","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"reasoning":true,"vision":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":2,"output":12},"tools":["function_calling"],"endpoints":["chat_completions"],"last_updated":"2026-06-03"},{"id":"google/gemini-3.5-flash","name":"gemini-3.5-flash","created_by":"google","source":"official","family":"gemini-3.5","description":"Gemini 3.5 Flash delivers near-Pro intelligence at Flash-tier cost and speed: Pro-level coding proficiency, parallel agentic execution, all at a much lower 
price.","status":"active","context_window":1000000,"model_type":"chat","reasoning_tokens":true,"license":"gemma","open_weight":false,"tagline":"Gemini 3.5 Flash delivers near-Pro intelligence at Flash-tier cost and speed: Pro-level coding proficiency, parallel agentic execution, all at a much lower price.","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"reasoning":true,"vision":true,"streaming":true,"fine_tuning":true,"batch":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":1.5,"output":9},"tools":["function_calling"],"endpoints":["chat_completions"],"last_updated":"2026-06-03","max_output_tokens":65536,"knowledge_cutoff":"2025-01"},{"id":"google/gemma-3-12b-it","name":"gemma-3-12b-it","created_by":"google","source":"official","last_updated":"2026-06-10","family":"gemma-3","description":"Gemma 3 introduces multimodality, supporting vision-language input and text outputs. It handles context windows up to 128k tokens, understands over 140 languages, and offers improved math, reasoning, and chat capabilities, including structured outputs and function calling. Gemma 3-12B is Google's latest open source model, successor to Gemma 2","status":"active","model_type":"chat","context_window":131072,"open_weight":true,"license":"gemma","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"vision":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":0.05,"output":0.15},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"bfloat16","tagline":"Gemma 3 introduces multimodality, supporting vision-language input and text outputs."},{"id":"google/gemma-3-27b-it","name":"gemma-3-27b-it","created_by":"google","source":"official","last_updated":"2026-04-26","family":"gemma-3","description":"Gemma 3 introduces multimodality, supporting vision-language input and text outputs. 
It handles context windows up to 128k tokens, understands over 140 languages, and offers improved math, reasoning, and chat capabilities, including structured outputs and function calling. Gemma 3 27B is Google's latest open source model, successor to Gemma 2","status":"active","model_type":"chat","context_window":131072,"open_weight":true,"license":"gemma","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"vision":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":0.08,"output":0.16},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"fp8","tagline":"Gemma 3 introduces multimodality, supporting vision-language input and text outputs."},{"id":"google/gemma-3-4b-it","name":"gemma-3-4b-it","created_by":"google","source":"official","last_updated":"2026-06-10","family":"gemma-3","description":"Gemma 3 introduces multimodality, supporting vision-language input and text outputs. It handles context windows up to 128k tokens, understands over 140 languages, and offers improved math, reasoning, and chat capabilities, including structured outputs and function calling. Gemma 3-12B is Google's latest open source model, successor to Gemma 2","status":"active","model_type":"chat","context_window":131072,"open_weight":true,"license":"gemma","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"vision":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":0.05,"output":0.1},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"bfloat16","tagline":"Gemma 3 introduces multimodality, supporting vision-language input and text outputs."},{"id":"google/gemma-4-26B-A4B-it","name":"gemma-4-26B-A4B-it","created_by":"google","source":"official","last_updated":"2026-04-26","family":"gemma-4","description":"Efficient, MoE variant of Gemma 4. 
Gemma is a family of open models built by Google DeepMind. Gemma 4 models are multimodal, handling text and image input and generating text output.","status":"active","model_type":"chat","context_window":262144,"reasoning_tokens":true,"open_weight":true,"license":"gemma","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"reasoning":true,"vision":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":0.07,"output":0.34},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"fp8","tagline":"Efficient, MoE variant of Gemma 4."},{"id":"google/gemma-4-31B-it-turbo","name":"gemma-4-31B-it-turbo","created_by":"google","source":"official","family":"gemma-4","description":"Gemma is a family of open models built by Google DeepMind. Gemma 4 models are multimodal, handling text and image input and generating text output.","status":"active","context_window":262144,"model_type":"chat","reasoning_tokens":true,"license":"gemma","open_weight":true,"tagline":"Gemma is a family of open models built by Google DeepMind.","capabilities":{"tool_call":true,"json_mode":true,"reasoning":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.12,"output":0.37},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"fp4","last_updated":"2026-06-03"},{"id":"google/gemma-4-31B-it","name":"gemma-4-31B-it","created_by":"google","source":"official","last_updated":"2026-04-26","family":"gemma-4","description":"Gemma is a family of open models built by Google DeepMind. 
Gemma 4 models are multimodal, handling text and image input and generating text output.","status":"active","model_type":"chat","context_window":262144,"reasoning_tokens":true,"open_weight":true,"license":"gemma","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"reasoning":true,"vision":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":0.13,"output":0.38},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"fp8","tagline":"Gemma is a family of open models built by Google DeepMind."},{"id":"google/veo-3.0-fast","name":"veo-3.0-fast","created_by":"google","source":"official","last_updated":"2026-04-26","family":"veo-3.0","description":"Veo 3 Fast is a speed-optimized version of the Veo 3 model, designed for rapid video creation. While maintaining high quality, it delivers results in a fraction of the time, making it ideal for quick iterations and dynamic content generation.","status":"active","model_type":"video","open_weight":false,"license":"gemma","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"tagline":"Veo 3 Fast is a speed-optimized version of the Veo 3 model, designed for rapid video creation."},{"id":"google/veo-3.0","name":"veo-3.0","created_by":"google","source":"official","last_updated":"2026-04-26","family":"veo-3.0","description":"Veo 3 is a state-of-the-art text-to-video model from Google that generates high-fidelity, cinematic videos with synchronized audio from a simple text prompt. 
It excels at creating realistic and imaginative scenes with a deep understanding of natural language and visual dynamics.","status":"active","model_type":"video","open_weight":false,"license":"gemma","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"tagline":"Veo 3 is a state-of-the-art text-to-video model from Google that generates high-fidelity, cinematic videos with synchronized audio from a simple text prompt."},{"id":"google/veo-3.1-fast","name":"veo-3.1-fast","created_by":"google","source":"official","last_updated":"2026-04-26","family":"veo-3.1","description":"Veo 3.1 is the latest text-to-video model from Google that generates high-fidelity, cinematic videos with synchronized audio from a simple text prompt. It excels at creating realistic and imaginative scenes with a deep understanding of natural language and visual dynamics.","status":"active","model_type":"video","open_weight":false,"license":"gemma","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"tagline":"Veo 3.1 is the latest text-to-video model from Google that generates high-fidelity, cinematic videos with synchronized audio from a simple text prompt."},{"id":"google/veo-3.1","name":"veo-3.1","created_by":"google","source":"official","last_updated":"2026-04-26","family":"veo-3.1","description":"Veo 3.1 is the latest text-to-video model from Google that generates high-fidelity, cinematic videos with synchronized audio from a simple text prompt. 
It excels at creating realistic and imaginative scenes with a deep understanding of natural language and visual dynamics.","status":"active","model_type":"video","open_weight":false,"license":"gemma","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"tagline":"Veo 3.1 is the latest text-to-video model from Google that generates high-fidelity, cinematic videos with synchronized audio from a simple text prompt."},{"id":"Gryphe/MythoMax-L2-13b","name":"MythoMax-L2-13b","created_by":"gryphe","source":"official","last_updated":"2026-04-26","family":"gryphe","status":"active","model_type":"chat","context_window":4096,"open_weight":true,"capabilities":{"structured_output":true,"json_mode":true,"streaming":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.4,"output":0.4},"endpoints":["chat_completions"],"quantization":"fp16"},{"id":"hexgrad/Kokoro-82M","name":"Kokoro-82M","created_by":"hexgrad","source":"official","last_updated":"2026-04-26","family":"hexgrad","description":"Kokoro is an open-weight TTS model with 82 million parameters. Despite its lightweight architecture, it delivers comparable quality to larger models while being significantly faster and more cost-efficient. With Apache-licensed weights, Kokoro can be deployed anywhere from production environments to personal projects.","status":"active","model_type":"tts","open_weight":true,"capabilities":{"streaming":true},"modalities":{"input":["text"],"output":["audio"]},"endpoints":["audio_speech"],"pricing_notes":["$0.6200 per 1M input characters"],"tagline":"Kokoro is an open-weight TTS model with 82 million parameters."},{"id":"intfloat/e5-base-v2","name":"e5-base-v2","created_by":"intfloat","source":"official","last_updated":"2026-04-26","family":"e5","description":"Text Embeddings by Weakly-Supervised Contrastive Pre-training. 
Model has 24 layers and 1024 out dim.","status":"active","model_type":"embed","open_weight":true,"license":"mit","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["embeddings"],"tagline":"Text Embeddings by Weakly-Supervised Contrastive Pre-training."},{"id":"intfloat/e5-large-v2","name":"e5-large-v2","created_by":"intfloat","source":"official","last_updated":"2026-04-26","family":"e5","description":"Text Embeddings by Weakly-Supervised Contrastive Pre-training. Model has 24 layers and 1024 out dim.","status":"active","model_type":"embed","open_weight":true,"license":"mit","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["embeddings"],"tagline":"Text Embeddings by Weakly-Supervised Contrastive Pre-training."},{"id":"intfloat/multilingual-e5-large-instruct","name":"multilingual-e5-large-instruct","created_by":"intfloat","source":"official","last_updated":"2026-04-26","family":"e5","description":"The Multilingual-E5 models, initialized from XLM-RoBERTa, support up to 512 tokens per input — any longer text will be silently truncated. 
To ensure optimal performance, always prefix inputs with “query:” or “passage:”, as the model was explicitly trained with this format.","status":"active","model_type":"embed","open_weight":true,"license":"mit","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["embeddings"],"tagline":"The Multilingual-E5 models, initialized from XLM-RoBERTa, support up to 512 tokens per input — any longer text will be silently truncated."},{"id":"intfloat/multilingual-e5-large","name":"multilingual-e5-large","created_by":"intfloat","source":"official","last_updated":"2026-04-26","family":"e5","description":"The Multilingual-E5-large model is a 24-layer text embedding model with an embedding size of 1024, trained on a mixture of multilingual datasets and supporting 100 languages.","status":"active","model_type":"embed","open_weight":true,"license":"mit","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["embeddings"],"quantization":"fp32","tagline":"The Multilingual-E5-large model is a 24-layer text embedding model with an embedding size of 1024, trained on a mixture of multilingual datasets and supporting 100 languages."},{"id":"inworld-ai/inworld-tts-1.5-max","name":"inworld-tts-1.5-max","created_by":"inworld-ai","source":"official","last_updated":"2026-04-26","family":"inworld-ai","description":"High-quality multilingual text-to-speech model by Inworld AI with 130+ preset voices across 15 languages. Supports voice cloning, word-level timestamps, and streaming. 
Optimized for natural, expressive speech with <250ms time-to-first-audio.","status":"active","model_type":"tts","open_weight":false,"capabilities":{"streaming":true},"modalities":{"input":["text"],"output":["audio"]},"endpoints":["audio_speech"],"pricing_notes":["$50.0000 per 1M input characters"],"tagline":"High-quality multilingual text-to-speech model by Inworld AI with 130+ preset voices across 15 languages."},{"id":"inworld-ai/inworld-tts-1.5-mini","name":"inworld-tts-1.5-mini","created_by":"inworld-ai","source":"official","last_updated":"2026-04-26","family":"inworld-ai","description":"Fast multilingual text-to-speech model by Inworld AI with 130+ preset voices across 15 languages. Supports voice cloning, word-level timestamps, and streaming. Optimized for low-latency applications with <130ms time-to-first-audio.","status":"active","model_type":"tts","open_weight":false,"capabilities":{"streaming":true},"modalities":{"input":["text"],"output":["audio"]},"endpoints":["audio_speech"],"pricing_notes":["$25.0000 per 1M input characters"],"tagline":"Fast multilingual text-to-speech model by Inworld AI with 130+ preset voices across 15 languages."},{"id":"inworld-ai/realtime-tts-1.5-max","name":"realtime-tts-1.5-max","created_by":"inworld-ai","source":"official","description":"High-quality multilingual text-to-speech model by Inworld AI with 130+ preset voices across 15 languages. Supports voice cloning, word-level timestamps, and streaming. 
Optimized for natural, expressive speech with <250ms time-to-first-audio.","status":"active","model_type":"tts","open_weight":false,"tagline":"High-quality multilingual text-to-speech model by Inworld AI with 130+ preset voices across 15 languages.","capabilities":{"streaming":true},"modalities":{"input":["text"],"output":["audio"]},"endpoints":["audio_speech"],"pricing_notes":["$50.0000 per 1M input characters"],"last_updated":"2026-06-03"},{"id":"inworld-ai/realtime-tts-1.5-mini","name":"realtime-tts-1.5-mini","created_by":"inworld-ai","source":"official","description":"Fast multilingual text-to-speech model by Inworld AI with 130+ preset voices across 15 languages. Supports voice cloning, word-level timestamps, and streaming. Optimized for low-latency applications with <130ms time-to-first-audio.","status":"active","model_type":"tts","open_weight":false,"tagline":"Fast multilingual text-to-speech model by Inworld AI with 130+ preset voices across 15 languages.","capabilities":{"streaming":true},"modalities":{"input":["text"],"output":["audio"]},"endpoints":["audio_speech"],"pricing_notes":["$25.0000 per 1M input characters"],"last_updated":"2026-06-03"},{"id":"inworld-ai/realtime-tts-2","name":"realtime-tts-2","created_by":"inworld-ai","source":"official","description":"Realtime TTS 2.0 is a low-latency text-to-speech model with natural language steering, allowing you to control tone and emotion directly in the prompt (e.g., “[be happy and upbeat] Hello!”). It supports cross-lingual voices and multiple languages, enabling the same voice to speak consistently across different languages. 
This is an early access preview ahead of full launch, with ongoing improvements to voice quality and steering.","status":"active","model_type":"tts","open_weight":false,"tagline":"Realtime TTS 2.0 is a low-latency text-to-speech model with natural language steering, allowing you to control tone and emotion directly in the prompt (e.g., “[be happy and upbeat] Hello!”).","capabilities":{"streaming":true},"modalities":{"input":["text"],"output":["audio"]},"endpoints":["audio_speech"],"pricing_notes":["$35.0000 per 1M input characters"],"last_updated":"2026-06-03"},{"id":"meta-llama/Llama-3.2-11B-Vision-Instruct","name":"Llama-3.2-11B-Vision-Instruct","created_by":"meta","source":"official","last_updated":"2026-06-10","family":"Llama-3.2","description":"Llama 3.2 11B Vision is a multimodal model with 11 billion parameters, designed to handle tasks combining visual and textual data. It excels in tasks such as image captioning and visual question answering, bridging the gap between language generation and visual reasoning. Pre-trained on a massive dataset of image-text pairs, it performs well in complex, high-accuracy image analysis. 
Its ability to integrate visual understanding with language processing makes it an ideal solution for industrie...","status":"active","model_type":"chat","context_window":131072,"open_weight":true,"capabilities":{"structured_output":true,"json_mode":true,"vision":true,"streaming":true,"fine_tuning":true,"tool_call":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":0.345,"output":0.345},"endpoints":["chat_completions"],"quantization":"fp8","license":"llama","tagline":"Llama 3.2 11B Vision is a multimodal model with 11 billion parameters, designed to handle tasks combining visual and textual data.","max_output_tokens":131072,"knowledge_cutoff":"2023-12","parameters":11},{"id":"meta-llama/Llama-3.3-70B-Instruct-Turbo","name":"Llama-3.3-70B-Instruct-Turbo","created_by":"meta","source":"official","last_updated":"2026-04-26","family":"Llama-3.3","description":"Llama 3.3-70B Turbo is a highly optimized version of the Llama 3.3-70B model, utilizing FP8 quantization to deliver significantly faster inference speeds with a minor trade-off in accuracy. The model is designed to be helpful, safe, and flexible, with a focus on responsible deployment and mitigating potential risks such as bias, toxicity, and misinformation. 
It achieves state-of-the-art performance on various benchmarks, including conversational tasks, language translation, and text generation.","status":"active","model_type":"chat","context_window":131072,"open_weight":true,"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.1,"output":0.32},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"fp8","license":"llama","tagline":"Llama 3.3-70B Turbo is a highly optimized version of the Llama 3.3-70B model, utilizing FP8 quantization to deliver significantly faster inference speeds with a minor trade-off in accuracy."},{"id":"meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8","name":"Llama-4-Maverick-17B-128E-Instruct-FP8","created_by":"meta","source":"official","last_updated":"2026-04-26","family":"Llama-4","description":"The Llama 4 collection of models are natively multimodal AI models that enable text and multimodal experiences. These models leverage a mixture-of-experts architecture to offer industry-leading performance in text and image understanding. 
Llama 4 Maverick, a 17 billion parameter model with 128 experts","status":"active","model_type":"chat","context_window":1048576,"open_weight":true,"capabilities":{"structured_output":true,"json_mode":true,"vision":true,"streaming":true,"fine_tuning":true,"tool_call":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":0.15,"output":0.6},"endpoints":["chat_completions"],"quantization":"fp8","license":"llama","tagline":"The Llama 4 collection of models are natively multimodal AI models that enable text and multimodal experiences.","max_output_tokens":16384,"parameters":402},{"id":"meta-llama/Llama-4-Scout-17B-16E-Instruct","name":"Llama-4-Scout-17B-16E-Instruct","created_by":"meta","source":"official","last_updated":"2026-06-10","family":"Llama-4","description":"The Llama 4 collection of models are natively multimodal AI models that enable text and multimodal experiences. These models leverage a mixture-of-experts architecture to offer industry-leading performance in text and image understanding. Llama 4 Scout, a 17 billion parameter model with 16 experts","status":"active","model_type":"chat","context_window":327680,"open_weight":true,"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"vision":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":0.1,"output":0.3},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"fp8","license":"llama","tagline":"The Llama 4 collection of models are natively multimodal AI models that enable text and multimodal experiences.","max_output_tokens":16384,"parameters":109},{"id":"meta-llama/Llama-Guard-4-12B","name":"Llama-Guard-4-12B","created_by":"meta","source":"official","last_updated":"2026-04-26","family":"llama-guard","description":"Llama Guard 4 is a natively multimodal safety classifier with 12 billion parameters trained jointly on text and multiple images. 
Llama Guard 4 is a dense architecture pruned from the Llama 4 Scout pre-trained model and fine-tuned for content safety classification. Similar to previous versions, it can be used to classify content in both LLM inputs (prompt classification) and in LLM responses (response classification). It itself acts as an LLM: it generates text in its output that indicates whe...","status":"active","model_type":"chat","context_window":163840,"open_weight":true,"capabilities":{"vision":true,"streaming":true,"fine_tuning":true,"tool_call":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":0.18,"output":0.18},"endpoints":["chat_completions"],"quantization":"bfloat16","license":"llama","tagline":"Llama Guard 4 is a natively multimodal safety classifier with 12 billion parameters trained jointly on text and multiple images.","parameters":12},{"id":"meta-llama/Meta-Llama-3-8B-Instruct","name":"Meta-Llama-3-8B-Instruct","created_by":"meta","source":"official","last_updated":"2026-04-26","family":"Llama-3","description":"Meta developed and released the Meta Llama 3 family of large language models (LLMs), a collection of pretrained and instruction tuned generative text models in 8 and 70B sizes.","status":"active","model_type":"chat","context_window":8192,"open_weight":true,"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.03,"output":0.04},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"bfloat16","license":"llama","tagline":"Meta developed and released the Meta Llama 3 family of large language models (LLMs), a collection of pretrained and instruction tuned generative text models in 8 and 70B 
sizes.","max_output_tokens":8192,"parameters":8},{"id":"meta-llama/Meta-Llama-3.1-70B-Instruct-Turbo","name":"Meta-Llama-3.1-70B-Instruct-Turbo","created_by":"meta","source":"official","last_updated":"2026-04-26","family":"Llama-3.1","description":"Meta developed and released the Meta Llama 3.1 family of large language models (LLMs), a collection of pretrained and instruction tuned generative text models in 8B, 70B and 405B sizes","status":"active","model_type":"chat","context_window":131072,"open_weight":true,"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.4,"output":0.4},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"fp8","license":"llama","tagline":"Meta developed and released the Meta Llama 3.1 family of large language models (LLMs), a collection of pretrained and instruction tuned generative text models in 8B, 70B and 405B sizes"},{"id":"meta-llama/Meta-Llama-3.1-70B-Instruct","name":"Meta-Llama-3.1-70B-Instruct","created_by":"meta","source":"official","last_updated":"2026-04-26","family":"Llama-3.1","description":"Meta developed and released the Meta Llama 3.1 family of large language models (LLMs), a collection of pretrained and instruction tuned generative text models in 8B, 70B and 405B sizes","status":"active","model_type":"chat","context_window":131072,"open_weight":true,"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.4,"output":0.4},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"bfloat16","license":"llama","tagline":"Meta developed and released the Meta Llama 3.1 family of large language models (LLMs), a collection of pretrained and instruction tuned generative text models in 8B, 70B and 405B 
sizes"},{"id":"meta-llama/Meta-Llama-3.1-8B-Instruct-Turbo","name":"Meta-Llama-3.1-8B-Instruct-Turbo","created_by":"meta","source":"official","last_updated":"2026-04-26","family":"Llama-3.1","description":"Meta developed and released the Meta Llama 3.1 family of large language models (LLMs), a collection of pretrained and instruction tuned generative text models in 8B, 70B and 405B sizes","status":"active","model_type":"chat","context_window":131072,"open_weight":true,"capabilities":{"tool_call":true,"json_mode":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.02,"output":0.03},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"fp8","license":"llama","tagline":"Meta developed and released the Meta Llama 3.1 family of large language models (LLMs), a collection of pretrained and instruction tuned generative text models in 8B, 70B and 405B sizes"},{"id":"meta-llama/Meta-Llama-3.1-8B-Instruct","name":"Meta-Llama-3.1-8B-Instruct","created_by":"meta","source":"official","last_updated":"2026-04-26","family":"Llama-3.1","description":"Meta developed and released the Meta Llama 3.1 family of large language models (LLMs), a collection of pretrained and instruction tuned generative text models in 8B, 70B and 405B sizes","status":"active","model_type":"chat","context_window":131072,"open_weight":true,"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.02,"output":0.05},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"bfloat16","license":"llama","tagline":"Meta developed and released the Meta Llama 3.1 family of large language models (LLMs), a collection of pretrained and instruction tuned generative text models in 8B, 70B and 405B 
sizes"},{"id":"microsoft/phi-4","name":"phi-4","created_by":"microsoft","source":"official","last_updated":"2026-04-26","family":"phi-4","description":"Phi-4 is a model built upon a blend of synthetic datasets, data from filtered public domain websites, and acquired academic books and Q&A datasets. The goal of this approach was to ensure that small capable models were trained with data focused on high quality and advanced reasoning.","status":"active","model_type":"chat","context_window":16384,"open_weight":true,"capabilities":{"structured_output":true,"json_mode":true,"streaming":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.07,"output":0.14},"endpoints":["chat_completions"],"quantization":"bfloat16","tagline":"Phi-4 is a model built upon a blend of synthetic datasets, data from filtered public domain websites, and acquired academic books and Q&A datasets."},{"id":"MiniMaxAI/MiniMax-M2.5","name":"MiniMax-M2.5","created_by":"minimax","source":"official","last_updated":"2026-04-26","family":"minimax","description":"MiniMax M2.5 is SOTA in coding, agentic tool use and search, office work, and a range of other economically valuable tasks, boasting scores of 80.2% in SWE-Bench Verified, 51.3% in Multi-SWE-Bench, and 76.3% in BrowseComp (with context management).","status":"active","model_type":"chat","context_window":196608,"reasoning_tokens":true,"open_weight":true,"license":"minimax","capabilities":{"tool_call":true,"json_mode":true,"reasoning":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.15,"output":1.15,"cached_input":0.03},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"fp8","tagline":"MiniMax M2.5 is SOTA in coding, agentic tool use and search, office work, and a range of other economically valuable tasks, boasting scores of 80.2% in SWE-Bench Verified, 51.3% in Multi-SWE-Bench, 
an"},{"id":"MiniMaxAI/MiniMax-M2.7-Turbo","name":"MiniMax-M2.7-Turbo","created_by":"minimax","source":"official","family":"minimax","description":"Speed-optimized MiniMax-M2.7","status":"active","context_window":196608,"model_type":"chat","reasoning_tokens":true,"license":"minimax","open_weight":false,"tagline":"Speed-optimized MiniMax-M2.7","capabilities":{"tool_call":true,"json_mode":true,"reasoning":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.4,"output":2},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"fp8","last_updated":"2026-06-30"},{"id":"MiniMaxAI/MiniMax-M2.7","name":"MiniMax-M2.7","created_by":"minimax","source":"official","family":"minimax","description":"MiniMax-M2.7 is MiniMax's first model deeply participating in its own evolution. M2.7 is capable of building complex agent harnesses and completing highly elaborate productivity tasks, leveraging Agent Teams, complex Skills, and dynamic tool search.","status":"active","context_window":196608,"model_type":"chat","reasoning_tokens":true,"license":"minimax","open_weight":true,"tagline":"MiniMax-M2.7 is MiniMax's first model deeply participating in its own evolution.","capabilities":{"tool_call":true,"json_mode":true,"reasoning":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.25,"output":1,"cached_input":0.05},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"fp8","last_updated":"2026-06-18"},{"id":"mistralai/Mistral-Nemo-Instruct-2407","name":"Mistral-Nemo-Instruct-2407","created_by":"mistral","source":"official","last_updated":"2026-04-26","family":"mistral","description":"12B model trained jointly by Mistral AI and NVIDIA, it significantly outperforms existing models smaller or similar in 
size.","status":"active","model_type":"chat","context_window":131072,"open_weight":true,"license":"apache-2.0","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.02,"output":0.04},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"fp8","tagline":"12B model trained jointly by Mistral AI and NVIDIA, it significantly outperforms existing models smaller or similar in size."},{"id":"mistralai/Mistral-Small-24B-Instruct-2501","name":"Mistral-Small-24B-Instruct-2501","created_by":"mistral","source":"official","last_updated":"2026-04-26","family":"mistral","description":"Mistral Small 3 is a 24B-parameter language model optimized for low-latency performance across common AI tasks. Released under the Apache 2.0 license, it features both pre-trained and instruction-tuned versions designed for efficient local deployment. The model achieves 81% accuracy on the MMLU benchmark and performs competitively with larger models like Llama 3.3 70B and Qwen 32B, while operating at three times the speed on equivalent hardware.","status":"active","model_type":"chat","context_window":32768,"open_weight":true,"license":"apache-2.0","capabilities":{"structured_output":true,"json_mode":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.05,"output":0.08},"endpoints":["chat_completions"],"quantization":"fp8","tagline":"Mistral Small 3 is a 24B-parameter language model optimized for low-latency performance across common AI tasks."},{"id":"mistralai/Mistral-Small-3.2-24B-Instruct-2506","name":"Mistral-Small-3.2-24B-Instruct-2506","created_by":"mistral","source":"official","last_updated":"2026-04-26","family":"mistral","description":"Mistral-Small-3.2-24B-Instruct is a drop-in upgrade over the 3.1 release, with markedly better instruction following, roughly half the 
infinite-generation errors, and a more robust function-calling interface—while otherwise matching or slightly improving on all previous text and vision benchmarks.","status":"active","model_type":"chat","context_window":128000,"open_weight":true,"license":"apache-2.0","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"vision":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":0.075,"output":0.2},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"fp8","tagline":"Mistral-Small-3.2-24B-Instruct is a drop-in upgrade over the 3.1 release, with markedly better instruction following, roughly half the infinite-generation errors, and a more robust function-calling in"},{"id":"mistralai/Mixtral-8x7B-Instruct-v0.1","name":"Mixtral-8x7B-Instruct-v0.1","created_by":"mistral","source":"official","last_updated":"2026-04-26","family":"mixtral","description":"Mixtral is mixture of expert large language model (LLM) from Mistral AI. This is state of the art machine learning model using a mixture 8 of experts (MoE) 7b models. During inference 2 expers are selected. This architecture allows large models to be fast and cheap at inference. 
The Mixtral-8x7B outperforms Llama 2 70B on most benchmarks.","status":"active","model_type":"chat","context_window":32768,"open_weight":true,"license":"apache-2.0","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.54,"output":0.54},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"fp8","tagline":"Mixtral is mixture of expert large language model (LLM) from Mistral AI."},{"id":"mistralai/Voxtral-Mini-3B-2507","name":"Voxtral-Mini-3B-2507","created_by":"mistral","source":"official","last_updated":"2026-04-26","family":"mistralai","description":"Voxtral Mini is an enhancement of Ministral 3B, incorporating state-of-the-art audio input capabilities while retaining best-in-class text performance. It excels at speech transcription, translation and audio understanding.","status":"active","model_type":"transcription","open_weight":true,"license":"apache-2.0","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["audio"],"output":["text"]},"endpoints":["audio_transcriptions"],"quantization":"bf16","tagline":"Voxtral Mini is an enhancement of Ministral 3B, incorporating state-of-the-art audio input capabilities while retaining best-in-class text performance."},{"id":"mistralai/Voxtral-Small-24B-2507","name":"Voxtral-Small-24B-2507","created_by":"mistral","source":"official","last_updated":"2026-04-26","family":"mistralai","description":"Voxtral Small is an enhancement of Mistral Small 3, incorporating state-of-the-art audio input capabilities while retaining best-in-class text performance. 
It excels at speech transcription, translation and audio understanding.","status":"active","model_type":"transcription","open_weight":true,"license":"apache-2.0","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["audio"],"output":["text"]},"endpoints":["audio_transcriptions"],"quantization":"bf16","tagline":"Voxtral Small is an enhancement of Mistral Small 3, incorporating state-of-the-art audio input capabilities while retaining best-in-class text performance."},{"id":"moonshotai/Kimi-K2.5","name":"Kimi-K2.5","created_by":"moonshot","source":"official","last_updated":"2026-04-26","family":"Kimi-K2.5","description":"Kimi K2.5 is an open-source, native multimodal agentic model built through continual pretraining on approximately 15 trillion mixed visual and text tokens atop Kimi-K2-Base. It seamlessly integrates vision and language understanding with advanced agentic capabilities, instant and thinking modes, as well as conversational and agentic paradigms.","status":"active","model_type":"chat","context_window":262144,"reasoning_tokens":true,"open_weight":true,"license":"modified-mit","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"reasoning":true,"vision":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":0.45,"output":2.25,"cached_input":0.07},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"fp4","tagline":"Kimi K2.5 is an open-source, native multimodal agentic model built through continual pretraining on approximately 15 trillion mixed visual and text tokens atop Kimi-K2-Base.","max_output_tokens":32768},{"id":"moonshotai/Kimi-K2.6","name":"Kimi-K2.6","created_by":"moonshot","source":"official","last_updated":"2026-06-03","family":"Kimi-K2.6","description":"Kimi K2.6 is an open-source, native multimodal agentic model that advances practical capabilities in long-horizon coding, coding-driven design, proactive 
autonomous execution, and swarm-based task orchestration.","status":"active","model_type":"chat","context_window":262144,"reasoning_tokens":true,"open_weight":true,"license":"modified-mit","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"reasoning":true,"streaming":true,"fine_tuning":true,"vision":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":0.75,"output":3.5,"cached_input":0.15},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"fp4","tagline":"Kimi K2.6 is an open-source, native multimodal agentic model that advances practical capabilities in long-horizon coding, coding-driven design, proactive autonomous execution, and swarm-based task orc"},{"id":"moonshotai/Kimi-K2.7-Code","name":"Kimi-K2.7-Code","created_by":"moonshot","source":"official","family":"Kimi-K2.7","description":"Kimi K2.7 Code is a coding-focused agentic model built upon Kimi K2.6. With substantial improvements on real-world long-horizon coding tasks, it strengthens end-to-end task completion across complex software engineering workflows while improving token efficiency, reducing thinking-token usage by approximately 30% compared with Kimi K2.6.","status":"active","context_window":262144,"model_type":"chat","reasoning_tokens":true,"license":"modified-mit","open_weight":true,"tagline":"Kimi K2.7 Code is a coding-focused agentic model built upon Kimi 
K2.6.","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"reasoning":true,"vision":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":0.74,"output":3.5,"cached_input":0.15},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"fp4","last_updated":"2026-06-18"},{"id":"NousResearch/Hermes-3-Llama-3.1-405B","name":"Hermes-3-Llama-3.1-405B","created_by":"nousresearch","source":"official","last_updated":"2026-04-26","family":"llama-3.1","description":"Hermes 3 is a cutting-edge language model that offers advanced capabilities in roleplaying, reasoning, and conversation. It's a fine-tuned version of the Llama-3.1 405B foundation model, designed to align with user needs and provide powerful control. Key features include reliable function calling, structured output, generalist assistant capabilities, and improved code generation. Hermes 3 is competitive with Llama-3.1 Instruct models, with its own strengths and weaknesses.","status":"active","model_type":"chat","context_window":131072,"open_weight":true,"capabilities":{"structured_output":true,"json_mode":true,"streaming":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":1,"output":1},"endpoints":["chat_completions"],"quantization":"fp8","tagline":"Hermes 3 is a cutting-edge language model that offers advanced capabilities in roleplaying, reasoning, and conversation."},{"id":"NousResearch/Hermes-3-Llama-3.1-70B","name":"Hermes-3-Llama-3.1-70B","created_by":"nousresearch","source":"official","last_updated":"2026-06-10","family":"llama-3.1","description":"Hermes 3 is a generalist language model with many improvements over Hermes 2, including advanced agentic capabilities, much better roleplaying, reasoning, multi-turn conversation, long context coherence, and improvements across the 
board.","status":"active","model_type":"chat","context_window":131072,"open_weight":true,"capabilities":{"structured_output":true,"json_mode":true,"streaming":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.7,"output":0.7},"endpoints":["chat_completions"],"quantization":"fp8","tagline":"Hermes 3 is a generalist language model with many improvements over Hermes 2, including advanced agentic capabilities, much better roleplaying, reasoning, multi-turn conversation, long context coheren"},{"id":"nvidia/Cosmos3-Nano","name":"Cosmos3-Nano","created_by":"nvidia","source":"official","description":"Cosmos3 is a world foundation model that unifies understanding and generation within a single Mixture-of-Transformer (MoT) architecture. Two tightly coupled towers—a Reasoner (vision-language model) and a Generator (world simulator)—share latent representations so that structured perception directly grounds realistic, temporally consistent simulation.","status":"active","model_type":"video","open_weight":true,"tagline":"Cosmos3 is a world foundation model that unifies understanding and generation within a single Mixture-of-Transformer (MoT) architecture.","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"pricing_notes":["$0.0108 / second (480p)"],"last_updated":"2026-06-03"},{"id":"nvidia/Cosmos3-Super","name":"Cosmos3-Super","created_by":"nvidia","source":"official","description":"Cosmos3 is a world foundation model that unifies understanding and generation within a single Mixture-of-Transformer (MoT) architecture. 
Two tightly coupled towers—a Reasoner (vision-language model) and a Generator (world simulator)—share latent representations so that structured perception directly grounds realistic, temporally consistent simulation.","status":"active","model_type":"video","open_weight":true,"tagline":"Cosmos3 is a world foundation model that unifies understanding and generation within a single Mixture-of-Transformer (MoT) architecture.","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"pricing_notes":["$0.0432 / second (480p)"],"last_updated":"2026-06-10"},{"id":"nvidia/Llama-3.1-Nemotron-70B-Instruct","name":"Llama-3.1-Nemotron-70B-Instruct","created_by":"nvidia","source":"official","last_updated":"2026-04-26","family":"Llama-3.1","description":"Llama-3.1-Nemotron-70B-Instruct is a large language model customized by NVIDIA to improve the helpfulness of LLM generated responses to user queries. This model reaches Arena Hard of 85.0, AlpacaEval 2 LC of 57.6 and GPT-4-Turbo MT-Bench of 8.98, which are known to be predictive of LMSys Chatbot Arena Elo. 
As of 16th Oct 2024, this model is #1 on all three automatic alignment benchmarks (verified tab for AlpacaEval 2 LC), edging out strong frontier models such as GPT-4o and Claude 3.5 Sonnet.","status":"active","model_type":"chat","context_window":131072,"open_weight":true,"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":1.2,"output":1.2},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"fp8","tagline":"Llama-3.1-Nemotron-70B-Instruct is a large language model customized by NVIDIA to improve the helpfulness of LLM generated responses to user queries."},{"id":"nvidia/Llama-3.3-Nemotron-Super-49B-v1.5","name":"Llama-3.3-Nemotron-Super-49B-v1.5","created_by":"nvidia","source":"official","last_updated":"2026-06-10","family":"Llama-3.3","description":"Llama-3.3-Nemotron-Super-49B-v1.5 is a large language model (LLM) optimized for advanced reasoning, conversational interactions, retrieval-augmented generation (RAG), and tool-calling tasks. 
Derived from Meta's Llama-3.3-70B-Instruct, it employs a Neural Architecture Search (NAS) approach, significantly enhancing efficiency and reducing memory requirements.","status":"active","model_type":"chat","context_window":131072,"reasoning_tokens":true,"open_weight":true,"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"reasoning":true,"streaming":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.4,"output":0.4},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"fp8","tagline":"Llama-3.3-Nemotron-Super-49B-v1.5 is a large language model (LLM) optimized for advanced reasoning, conversational interactions, retrieval-augmented generation (RAG), and tool-calling tasks."},{"id":"nvidia/llama-nemotron-embed-vl-1b-v2","name":"llama-nemotron-embed-vl-1b-v2","created_by":"nvidia","source":"official","last_updated":"2026-04-26","family":"llama","description":"The llama-nemotron-embed-vl-1b-v2 is a high-performance multimodal embedding model designed to transform text queries and document images into dense vector representations for advanced retrieval systems. It excels at understanding complex visual content like charts, tables, and infographics.","status":"active","model_type":"embed","open_weight":true,"capabilities":{"streaming":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["embeddings"],"tagline":"The llama-nemotron-embed-vl-1b-v2 is a high-performance multimodal embedding model designed to transform text queries and document images into dense vector representations for advanced retrieval systems."},{"id":"nvidia/llama-nemotron-rerank-vl-1b-v2","name":"llama-nemotron-rerank-vl-1b-v2","created_by":"nvidia","source":"official","last_updated":"2026-04-26","family":"llama","description":"The llama-nemotron-rerank-vl-1b-v2 is a 1.7B parameter multimodal reranking model designed to evaluate and order the relevance of document images and text against specific user queries. 
It excels at understanding complex visual content like charts, tables, and infographics.","status":"active","model_type":"rerank","open_weight":true,"modalities":{"input":["text"],"output":["text"]},"endpoints":["rerank"],"quantization":"bf16","tagline":"The llama-nemotron-rerank-vl-1b-v2 is a 1.7B parameter multimodal reranking model designed to evaluate and order the relevance of document images and text against specific user queries."},{"id":"nvidia/Nemotron-3-Nano-30B-A3B","name":"Nemotron-3-Nano-30B-A3B","created_by":"nvidia","source":"official","last_updated":"2026-04-26","family":"nemotron","description":"NVIDIA Nemotron 3 Nano is an open small reasoning model optimized for fast, cost-efficient inference in agentic and production workloads. Built with a hybrid Mixture-of-Experts (MoE) and Mamba-Transformer architecture, it delivers strong multi-step reasoning, high token throughput, stable latency with predictable cost, and efficient deployment for agent-based systems. Designed for real-world AI systems where reasoning can generate significantly more tokens per prompt, Nemotron Nano reduces co...","status":"active","model_type":"chat","context_window":262144,"reasoning_tokens":true,"open_weight":true,"capabilities":{"tool_call":true,"reasoning":true,"streaming":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.05,"output":0.2},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"fp4","tagline":"NVIDIA Nemotron 3 Nano is an open small reasoning model optimized for fast, cost-efficient inference in agentic and production workloads."},{"id":"nvidia/Nemotron-3-Nano-Omni-30B-A3B-Reasoning","name":"Nemotron-3-Nano-Omni-30B-A3B-Reasoning","created_by":"nvidia","source":"official","description":"Nemotron 3 Nano Omni is an open multimodal model built on a hybrid Mixture-of-Experts (MoE) architecture, engineered for high efficiency and strong accuracy across image, video, audio, and text inputs. 
It powers always-on sub-agents for computer use, document intelligence, and audio-video understanding—replacing fragmented vision, speech, and language pipelines with a single unified inference pass.","status":"active","context_window":262144,"model_type":"chat","reasoning_tokens":true,"open_weight":true,"tagline":"Nemotron 3 Nano Omni is an open multimodal model built on a hybrid Mixture-of-Experts (MoE) architecture, engineered for high efficiency and strong accuracy across image, video, audio, and text inputs.","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"reasoning":true,"vision":true,"streaming":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":0.2,"output":0.8},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"bfloat16","last_updated":"2026-06-03"},{"id":"nvidia/Nemotron-3.5-ASR-Streaming-Multilingual-0.6b","name":"Nemotron-3.5-ASR-Streaming-Multilingual-0.6b","created_by":"nvidia","source":"official","description":"Nemotron 3.5 ASR Streaming Multilingual is an open 0.6B-parameter prompt-conditioned cache-aware FastConformer-RNNT model, engineered for low-latency streaming transcription across 40+ languages. 
It powers real-time captioning, voice agents, and multilingual transcription pipelines—replacing separate per-language Whisper deployments with a single inference pass.","status":"active","model_type":"transcription","open_weight":true,"tagline":"Nemotron 3.5 ASR Streaming Multilingual is an open 0.6B-parameter prompt-conditioned cache-aware FastConformer-RNNT model, engineered for low-latency streaming transcription across 40+ languages.","capabilities":{"streaming":true},"modalities":{"input":["audio"],"output":["text"]},"endpoints":["audio_transcriptions"],"last_updated":"2026-06-10"},{"id":"nvidia/Nemotron-Content-Safety-3.5","name":"Nemotron-Content-Safety-3.5","created_by":"nvidia","source":"official","description":"Nemotron Content Safety 3.5 is a multimodal safety classifier developed by NVIDIA. A compact safety model that handles text, images, and custom policies. It outputs a safe/unsafe classification plus a reasoning trace, and can be used as an inference-time guardrail, as a judge for LLM safety testing and evaluation, or with the accompanying training dataset to post-train models for safer behavior.","status":"active","context_window":131072,"model_type":"chat","open_weight":true,"tagline":"Nemotron Content Safety 3.5 is a multimodal safety classifier developed by NVIDIA.","capabilities":{"vision":true,"streaming":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":0.2,"output":0.2},"endpoints":["chat_completions"],"quantization":"bfloat16","last_updated":"2026-06-10"},{"id":"nvidia/NVIDIA-Nemotron-3-Super-120B-A12B","name":"NVIDIA-Nemotron-3-Super-120B-A12B","created_by":"nvidia","source":"official","last_updated":"2026-06-29","family":"nemotron","description":"NVIDIA Nemotron 3 Super is a hybrid Mixture-of-Experts (MoE) model engineered for highest compute efficiency and accuracy in multi-agent applications and specialized agentic systems. 
It is optimized to run many collaborating agents per application on a single GPU, delivering high accuracy for reasoning, tool use, and instruction following.","status":"active","model_type":"chat","context_window":262144,"reasoning_tokens":true,"open_weight":true,"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"reasoning":true,"streaming":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.085,"output":0.4},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"bfloat16","tagline":"NVIDIA Nemotron 3 Super is a hybrid Mixture-of-Experts (MoE) model engineered for highest compute efficiency and accuracy in multi-agent applications and specialized agentic systems."},{"id":"nvidia/NVIDIA-Nemotron-3-Ultra-550B-A55B-BF16","name":"NVIDIA-Nemotron-3-Ultra-550B-A55B-BF16","created_by":"nvidia","source":"official","description":"Nemotron 3 Ultra is built for, frontier reasoning, orchestration, coding agents, deep research, and complex enterprise workflows. 
It delivers up to 5x faster inference and up to 30% lower cost for agentic workloads while supporting up to 1M token context.","status":"active","context_window":262144,"model_type":"chat","reasoning_tokens":true,"open_weight":true,"tagline":"Nemotron 3 Ultra is built for, frontier reasoning, orchestration, coding agents, deep research, and complex enterprise workflows.","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"reasoning":true,"vision":true,"streaming":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":1,"output":5,"cached_input":0.3},"tools":["function_calling"],"endpoints":["chat_completions"],"last_updated":"2026-06-18"},{"id":"nvidia/NVIDIA-Nemotron-3-Ultra-550B-A55B","name":"NVIDIA-Nemotron-3-Ultra-550B-A55B","created_by":"nvidia","source":"official","description":"Nemotron 3 Ultra is built for, frontier reasoning, orchestration, coding agents, deep research, and complex enterprise workflows. It delivers up to 5x faster inference and up to 30% lower cost for agentic workloads while supporting up to 1M token context.","status":"active","context_window":262144,"model_type":"chat","reasoning_tokens":true,"open_weight":true,"tagline":"Nemotron 3 Ultra is built for, frontier reasoning, orchestration, coding agents, deep research, and complex enterprise workflows.","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"reasoning":true,"vision":true,"streaming":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":0.5,"output":2.2,"cached_input":0.1},"tools":["function_calling"],"endpoints":["chat_completions"],"last_updated":"2026-06-18"},{"id":"nvidia/NVIDIA-Nemotron-Nano-12B-v2-VL","name":"NVIDIA-Nemotron-Nano-12B-v2-VL","created_by":"nvidia","source":"official","last_updated":"2026-04-26","family":"nemotron","description":"NVIDIA Nemotron 2 Nano VL extends the Nemotron family into multi-modal reasoning and document intelligence. 
This auto-regressive vision-language model enables multi-image reasoning, video understanding, visual Q&A and document analysis and summarization. Optimized for enterprise AI workflows, it powers multimodal agentic systems such as visual copilots, document assistants, and knowledge automation pipelines.","status":"active","model_type":"chat","context_window":131072,"reasoning_tokens":true,"open_weight":true,"capabilities":{"reasoning":true,"vision":true,"streaming":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":0.2,"output":0.6},"endpoints":["chat_completions"],"quantization":"fp8","tagline":"NVIDIA Nemotron 2 Nano VL extends the Nemotron family into multi-modal reasoning and document intelligence."},{"id":"nvidia/NVIDIA-Nemotron-Nano-9B-v2","name":"NVIDIA-Nemotron-Nano-9B-v2","created_by":"nvidia","source":"official","last_updated":"2026-04-26","family":"nemotron","description":"NVIDIA-Nemotron-Nano-9B-v2 is a large language model (LLM) trained from scratch by NVIDIA, and designed as a unified model for both reasoning and non-reasoning tasks. It responds to user queries and tasks by first generating a reasoning trace and then concluding with a final response. The model's reasoning capabilities can be controlled via a system prompt. 
If the user prefers the model to provide its final answer without intermediate reasoning traces, it can be configured to do so.","status":"active","model_type":"chat","context_window":131072,"reasoning_tokens":true,"open_weight":true,"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"reasoning":true,"streaming":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.04,"output":0.16},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"bfloat16","tagline":"NVIDIA-Nemotron-Nano-9B-v2 is a large language model (LLM) trained from scratch by NVIDIA, and designed as a unified model for both reasoning and non-reasoning tasks."},{"id":"openai/clip-vit-base-patch32","name":"clip-vit-base-patch32","created_by":"openai","source":"official","last_updated":"2026-04-26","family":"openai","description":"The CLIP model was developed by OpenAI to investigate the robustness of computer vision models. It uses a Vision Transformer architecture and was trained on a large dataset of image-caption pairs. The model shows promise in various computer vision tasks but also has limitations, including difficulties with fine-grained classification and potential biases in certain applications.","status":"active","model_type":"image","open_weight":true,"license":"proprietary","capabilities":{"streaming":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"pricing_notes":["$0.000500 per second"],"tagline":"The CLIP model was developed by OpenAI to investigate the robustness of computer vision models."},{"id":"openai/clip-vit-large-patch14-336","name":"clip-vit-large-patch14-336","created_by":"openai","source":"official","last_updated":"2026-04-26","family":"openai","description":"A zero-shot-image-classification model released by OpenAI. The clip-vit-large-patch14-336 model was trained from scratch on an unknown dataset and achieves unspecified results on the evaluation set. 
The model's intended uses and limitations, as well as its training and evaluation data, are not provided. The training procedure used an unknown optimizer and precision, and the framework versions included Transformers 4.21.3, TensorFlow 2.8.2, and Tokenizers 0.12.1.","status":"active","model_type":"image","open_weight":true,"license":"proprietary","capabilities":{"streaming":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"pricing_notes":["$0.000500 per second"],"tagline":"A zero-shot-image-classification model released by OpenAI."},{"id":"openai/gpt-oss-120b-Turbo","name":"gpt-oss-120b-Turbo","created_by":"openai","source":"official","last_updated":"2026-04-26","family":"gpt-oss","status":"active","model_type":"chat","context_window":131072,"reasoning_tokens":true,"open_weight":true,"license":"proprietary","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"reasoning":true,"streaming":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.15,"output":0.6},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"bfloat16"},{"id":"openai/gpt-oss-120b","name":"gpt-oss-120b","created_by":"openai","source":"official","last_updated":"2026-04-26","family":"gpt-oss","description":"gpt-oss-120b is an open-weight, 117B-parameter Mixture-of-Experts (MoE) language model from OpenAI designed for high-reasoning, agentic, and general-purpose production use cases. 
The model supports configurable reasoning depth, full chain-of-thought access, and native tool use, including function calling, browsing, and structured output generation.","status":"active","model_type":"chat","context_window":131072,"reasoning_tokens":true,"open_weight":true,"license":"proprietary","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"reasoning":true,"streaming":true,"fine_tuning":false,"vision":false,"batch":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.039,"output":0.19},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"bfloat16","tagline":"gpt-oss-120b is an open-weight, 117B-parameter Mixture-of-Experts (MoE) language model from OpenAI designed for high-reasoning, agentic, and general-purpose production use cases.","max_output_tokens":131072,"knowledge_cutoff":"2024-06","parameters":120},{"id":"openai/gpt-oss-20b","name":"gpt-oss-20b","created_by":"openai","source":"official","last_updated":"2026-04-26","family":"gpt-oss","description":"gpt-oss-20b is an open-weight 21B parameter model released by OpenAI under the Apache 2.0 license. It uses a Mixture-of-Experts (MoE) architecture with 3.6B active parameters per forward pass, optimized for lower-latency inference. 
The model is trained in OpenAI’s Harmony response format and supports reasoning level configuration, fine-tuning, and agentic capabilities including function calling, tool use, and structured outputs.","status":"active","model_type":"chat","context_window":131072,"reasoning_tokens":true,"open_weight":true,"license":"proprietary","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"reasoning":true,"streaming":true,"fine_tuning":false,"vision":false,"batch":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.03,"output":0.14},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"bfloat16","tagline":"gpt-oss-20b is an open-weight 21B parameter model released by OpenAI under the Apache 2.0 license.","max_output_tokens":131072,"knowledge_cutoff":"2024-06","parameters":20},{"id":"openai/whisper-large-v3-turbo","name":"whisper-large-v3-turbo","created_by":"openai","source":"official","last_updated":"2026-04-26","family":"whisper","description":"Whisper is a state-of-the-art model for automatic speech recognition (ASR) and speech translation, proposed in the paper \"Robust Speech Recognition via Large-Scale Weak Supervision\" by Alec Radford et al. from OpenAI. Trained on >5M hours of labeled data, Whisper demonstrates a strong ability to generalise to many datasets and domains in a zero-shot setting. Whisper large-v3-turbo is a finetuned version of a pruned Whisper large-v3. 
In other words, it's the exact same model, except that the n...","status":"active","model_type":"transcription","open_weight":true,"license":"proprietary","capabilities":{"streaming":true},"modalities":{"input":["audio"],"output":["text"]},"endpoints":["audio_transcriptions"],"tagline":"Whisper is a state-of-the-art model for automatic speech recognition (ASR) and speech translation, proposed in the paper \"Robust Speech Recognition via Large-Scale Weak Supervision\" by Alec Radford et al."},{"id":"openai/whisper-large-v3","name":"whisper-large-v3","created_by":"openai","source":"official","last_updated":"2026-04-26","family":"whisper","description":"Whisper is a general-purpose speech recognition model. It is trained on a large dataset of diverse audio and is also a multi-task model that can perform multilingual speech recognition as well as speech translation and language identification.","status":"active","model_type":"transcription","open_weight":true,"license":"proprietary","capabilities":{"streaming":true},"modalities":{"input":["audio"],"output":["text"]},"endpoints":["audio_transcriptions"],"tagline":"Whisper is a general-purpose speech recognition model."},{"id":"PaddlePaddle/PaddleOCR-VL-0.9B","name":"PaddleOCR-VL-0.9B","created_by":"paddlepaddle","source":"official","last_updated":"2026-04-26","family":"paddlepaddle","description":"PaddleOCR-VL is a SOTA and resource-efficient model tailored for document parsing. Its core component is PaddleOCR-VL-0.9B, a compact yet powerful vision-language model (VLM) that integrates a NaViT-style dynamic resolution visual encoder with the ERNIE-4.5-0.3B language model to enable accurate element recognition. 
This innovative model efficiently supports 109 languages and excels in recognizing complex elements (e.g., text, tables, formulas, and charts), while maintaining minimal resource ...","status":"active","model_type":"chat","context_window":16384,"open_weight":true,"capabilities":{"structured_output":true,"json_mode":true,"vision":true,"streaming":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":0.14,"output":0.8},"endpoints":["chat_completions"],"quantization":"bfloat16","tagline":"PaddleOCR-VL is a SOTA and resource-efficient model tailored for document parsing."},{"id":"Pixverse/Pixverse-6-I2V","name":"Pixverse-6-I2V","created_by":"pixverse","source":"official","description":"PixVerse V6 redefines AI video by shifting from isolated generation to a unified, model-driven workflow. Key upgrades include 15-second durations at 1080p resolution and a multi-shot engine. This transition allows creators to move beyond short clips toward meaningful narrative production and professional-grade marketing assets suitable for 2026 digital distribution standards.","status":"active","model_type":"video","open_weight":false,"tagline":"PixVerse V6 redefines AI video by shifting from isolated generation to a unified, model-driven workflow.","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"pricing_notes":["$0.045 / second"],"last_updated":"2026-06-03"},{"id":"Pixverse/Pixverse-6-T2V","name":"Pixverse-6-T2V","created_by":"pixverse","source":"official","description":"PixVerse V6 redefines AI video by shifting from isolated generation to a unified, model-driven workflow. Key upgrades include 15-second durations at 1080p resolution and a multi-shot engine. 
This transition allows creators to move beyond short clips toward meaningful narrative production and professional-grade marketing assets suitable for 2026 digital distribution standards.","status":"active","model_type":"video","open_weight":false,"tagline":"PixVerse V6 redefines AI video by shifting from isolated generation to a unified, model-driven workflow.","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"pricing_notes":["$0.045 / second"],"last_updated":"2026-06-03"},{"id":"Pixverse/Pixverse-T2V-HD","name":"Pixverse-T2V-HD","created_by":"pixverse","source":"official","last_updated":"2026-04-26","family":"pixverse","description":"The 1080p high-fidelity mode in PixVerse renders videos with significantly enhanced sharpness and visual clarity, capturing intricate details and providing a crisp, professional-grade quality suitable for more polished projects.","status":"active","model_type":"video","open_weight":false,"modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"pricing_notes":["$0.4000 per image unit (0x0 default)"],"tagline":"The 1080p high-fidelity mode in PixVerse renders videos with significantly enhanced sharpness and visual clarity, capturing intricate details and providing a crisp, professional-grade quality suitable"},{"id":"Pixverse/Pixverse-T2V","name":"Pixverse-T2V","created_by":"pixverse","source":"official","last_updated":"2026-04-26","family":"pixverse","description":"PixVerse's 720p resolution offers a fast and reliable option for generating standard HD videos, ideal for quick previews and social media content where generation speed is prioritized over maximum detail.","status":"active","model_type":"video","open_weight":false,"modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"pricing_notes":["$0.2000 per image unit (0x0 default)"],"tagline":"PixVerse's 720p resolution offers a fast and reliable option for generating standard HD videos, ideal for quick previews and social 
media content where generation speed is prioritized over maximum det"},{"id":"PrunaAI/p-image-Edit","name":"p-image-Edit","created_by":"prunaai","source":"official","last_updated":"2026-04-26","family":"prunaai","description":"P-Image-Edit is a high-precision image editing model that applies complex transformations, insertions, removals, and style adjustments in under a second. It delivers state-of-the-art accuracy, clean boundaries, and reliable prompt alignment, making multi-step edits fast, consistent, and production-ready.","status":"active","model_type":"image","open_weight":false,"capabilities":{"streaming":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"pricing_notes":["$0.0100 per image unit (0x0 default)"],"tagline":"P-Image-Edit is a high-precision image editing model that applies complex transformations, insertions, removals, and style adjustments in under a second."},{"id":"PrunaAI/p-image","name":"p-image","created_by":"prunaai","source":"official","last_updated":"2026-04-26","family":"prunaai","description":"P-Image is a state-of-the-art real-time generation model with exceptional text rendering, fine-detail accuracy, and rock-solid prompt adherence. It’s built for instant creativity at high-fidelity images in about one second at a fraction of typical model costs.","status":"active","model_type":"image","open_weight":false,"capabilities":{"streaming":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"pricing_notes":["$0.0050 per image unit (0x0 default)"],"tagline":"P-Image is a state-of-the-art real-time generation model with exceptional text rendering, fine-detail accuracy, and rock-solid prompt adherence."},{"id":"PrunaAI/p-video-avatar","name":"p-video-avatar","created_by":"prunaai","source":"official","description":"Pruna's talking head video generation model. 
Provide a portrait image and either a speech script or an audio file, and the model generates a realistic video of the person speaking. Supports multiple voices, languages, and output resolutions.","status":"active","model_type":"video","open_weight":false,"tagline":"Pruna's talking head video generation model.","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"pricing_notes":["$0.025 / second"],"last_updated":"2026-06-03"},{"id":"PrunaAI/p-video","name":"p-video","created_by":"prunaai","source":"official","last_updated":"2026-04-26","family":"prunaai","description":"Real-time AI video generation from text, images, and audio. Supports up to 1080p at 48 FPS with built-in audio generation, draft mode for 4x faster previews, and prompt upsampling.","status":"active","model_type":"video","open_weight":false,"modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"pricing_notes":["$0.02 / second"],"tagline":"Real-time AI video generation from text, images, and audio."},{"id":"Qwen/Qwen-Image-Edit-Max","name":"Qwen-Image-Edit-Max","created_by":"alibaba","source":"official","last_updated":"2026-04-26","family":"qwen","description":"Enhanced industrial design and geometric reasoning, improved character consistency, reduced offset issues, and integrated LoRA capabilities","status":"active","model_type":"image","open_weight":false,"license":"apache-2.0","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"pricing_notes":["$0.0750 per image unit (0x0 default)"],"tagline":"Enhanced industrial design and geometric reasoning, improved character consistency, reduced offset issues, and integrated LoRA capabilities"},{"id":"Qwen/Qwen-Image-Edit","name":"Qwen-Image-Edit","created_by":"alibaba","source":"official","last_updated":"2026-04-26","family":"qwen","description":"Qwen-Image-Edit is a next-generation image editing model built on top of Qwen-Image, designed for 
both semantic and appearance-level edits. It excels at tasks like precise text modifications, style transfers, viewpoint transformations, and element adjustments while preserving overall visual consistency.","status":"active","model_type":"image","open_weight":true,"license":"apache-2.0","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"pricing_notes":["$0.0250 per image unit (1024x1024 default)"],"tagline":"Qwen-Image-Edit is a next-generation image editing model built on top of Qwen-Image, designed for both semantic and appearance-level edits."},{"id":"Qwen/Qwen-Image-Max","name":"Qwen-Image-Max","created_by":"alibaba","source":"official","last_updated":"2026-04-26","family":"qwen","description":"Compared with the Plus series, it significantly reduces the “AI-like” feel in generated images, enhancing their realism. It delivers more lifelike material textures for human subjects, finer and more detailed natural textures, and more visually appealing text rendering.","status":"active","model_type":"image","open_weight":false,"license":"apache-2.0","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"pricing_notes":["$0.0750 per image unit (0x0 default)"],"tagline":"Compared with the Plus series, it significantly reduces the “AI-like” feel in generated images, enhancing their realism."},{"id":"Qwen/Qwen2.5-72B-Instruct","name":"Qwen2.5-72B-Instruct","created_by":"alibaba","source":"official","last_updated":"2026-04-26","family":"qwen2.5","description":"Qwen2.5 is a model pretrained on a large-scale dataset of up to 18 trillion tokens, offering significant improvements in knowledge, coding, mathematics, and instruction following compared to its predecessor Qwen2. 
The model also features enhanced capabilities in generating long texts, understanding structured data, and generating structured outputs, while supporting multilingual capabilities for over 29 languages.","status":"active","model_type":"chat","context_window":32768,"open_weight":true,"license":"apache-2.0","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.36,"output":0.4},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"fp8","tagline":"Qwen2.5 is a model pretrained on a large-scale dataset of up to 18 trillion tokens, offering significant improvements in knowledge, coding, mathematics, and instruction following compared to its predecessor Qwen2."},{"id":"Qwen/Qwen3-14B","name":"Qwen3-14B","created_by":"alibaba","source":"official","last_updated":"2026-04-26","family":"qwen3","description":"Qwen3 is the latest generation of large language models in Qwen series, offering a comprehensive suite of dense and mixture-of-experts (MoE) models. 
Built upon extensive training, Qwen3 delivers groundbreaking advancements in reasoning, instruction-following, agent capabilities, and multilingual support.","status":"active","model_type":"chat","context_window":40960,"open_weight":true,"license":"apache-2.0","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.12,"output":0.24},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"fp8","tagline":"Qwen3 is the latest generation of large language models in Qwen series, offering a comprehensive suite of dense and mixture-of-experts (MoE) models."},{"id":"Qwen/Qwen3-235B-A22B-Instruct-2507","name":"Qwen3-235B-A22B-Instruct-2507","created_by":"alibaba","source":"official","last_updated":"2026-06-10","family":"qwen3","description":"Qwen3-235B-A22B-Instruct-2507 is the updated version of the Qwen3-235B-A22B non-thinking mode, featuring Significant improvements in general capabilities, including instruction following, logical reasoning, text comprehension, mathematics, science, coding and tool usage.","status":"active","model_type":"chat","context_window":262144,"open_weight":true,"license":"apache-2.0","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.09,"output":0.1},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"fp8","tagline":"Qwen3-235B-A22B-Instruct-2507 is the updated version of the Qwen3-235B-A22B non-thinking mode, featuring Significant improvements in general capabilities, including instruction following, logical reas"},{"id":"Qwen/Qwen3-235B-A22B-Thinking-2507","name":"Qwen3-235B-A22B-Thinking-2507","created_by":"alibaba","source":"official","last_updated":"2026-04-26","family":"qwen3","description":"Qwen3-235B-A22B-Thinking-2507 is the Qwen3's new 
model with scaling the thinking capability of Qwen3-235B-A22B, improving both the quality and depth of reasoning.","status":"active","model_type":"chat","context_window":262144,"reasoning_tokens":true,"open_weight":true,"license":"apache-2.0","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"reasoning":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.23,"output":2.3,"cached_input":0.2},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"fp8","tagline":"Qwen3-235B-A22B-Thinking-2507 is the Qwen3's new model with scaling the thinking capability of Qwen3-235B-A22B, improving both the quality and depth of reasoning."},{"id":"Qwen/Qwen3-30B-A3B","name":"Qwen3-30B-A3B","created_by":"alibaba","source":"official","last_updated":"2026-06-10","family":"qwen3","description":"Qwen3 is the latest generation of large language models in Qwen series, offering a comprehensive suite of dense and mixture-of-experts (MoE) models. 
Built upon extensive training, Qwen3 delivers groundbreaking advancements in reasoning, instruction-following, agent capabilities, and multilingual support","status":"active","model_type":"chat","context_window":40960,"open_weight":true,"license":"apache-2.0","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.12,"output":0.5},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"fp8","tagline":"Qwen3 is the latest generation of large language models in Qwen series, offering a comprehensive suite of dense and mixture-of-experts (MoE) models."},{"id":"Qwen/Qwen3-32B","name":"Qwen3-32B","created_by":"alibaba","source":"official","last_updated":"2026-04-26","family":"qwen3","description":"Qwen3 is the latest generation of large language models in Qwen series, offering a comprehensive suite of dense and mixture-of-experts (MoE) models. Built upon extensive training, Qwen3 delivers groundbreaking advancements in reasoning, instruction-following, agent capabilities, and multilingual support","status":"active","model_type":"chat","context_window":40960,"open_weight":true,"license":"apache-2.0","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.08,"output":0.28},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"fp8","tagline":"Qwen3 is the latest generation of large language models in Qwen series, offering a comprehensive suite of dense and mixture-of-experts (MoE) models."},{"id":"Qwen/Qwen3-Coder-480B-A35B-Instruct-Turbo","name":"Qwen3-Coder-480B-A35B-Instruct-Turbo","created_by":"alibaba","source":"official","last_updated":"2026-04-26","family":"qwen3","description":"Qwen3-Coder-480B-A35B-Instruct is the Qwen3's most agentic code model, featuring Significant 
Performance on Agentic Coding, Agentic Browser-Use and other foundational coding tasks, achieving results comparable to Claude Sonnet.","status":"active","model_type":"chat","context_window":262144,"open_weight":true,"license":"apache-2.0","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.3,"output":1,"cached_input":0.1},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"fp4","tagline":"Qwen3-Coder-480B-A35B-Instruct is the Qwen3's most agentic code model, featuring Significant Performance on Agentic Coding, Agentic Browser-Use and other foundational coding tasks, achieving results c"},{"id":"Qwen/Qwen3-Embedding-0.6B-batch","name":"Qwen3-Embedding-0.6B-batch","created_by":"alibaba","source":"official","last_updated":"2026-04-26","family":"qwen3","description":"The Qwen3 Embedding model series is the latest proprietary model of the Qwen family, specifically designed for text embedding and ranking tasks. Building upon the dense foundational models of the Qwen3 series, it provides a comprehensive range of text embeddings and reranking models in various sizes (0.6B, 4B, and 8B).","status":"active","model_type":"embed","open_weight":true,"license":"apache-2.0","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["embeddings"],"tagline":"The Qwen3 Embedding model series is the latest proprietary model of the Qwen family, specifically designed for text embedding and ranking tasks."},{"id":"Qwen/Qwen3-Embedding-0.6B","name":"Qwen3-Embedding-0.6B","created_by":"alibaba","source":"official","last_updated":"2026-04-26","family":"qwen3","description":"The Qwen3 Embedding model series is the latest proprietary model of the Qwen family, specifically designed for text embedding and ranking tasks. 
Building upon the dense foundational models of the Qwen3 series, it provides a comprehensive range of text embeddings and reranking models in various sizes (0.6B, 4B, and 8B).","status":"active","model_type":"embed","open_weight":true,"license":"apache-2.0","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["embeddings"],"tagline":"The Qwen3 Embedding model series is the latest proprietary model of the Qwen family, specifically designed for text embedding and ranking tasks."},{"id":"Qwen/Qwen3-Embedding-4B-batch","name":"Qwen3-Embedding-4B-batch","created_by":"alibaba","source":"official","last_updated":"2026-04-26","family":"qwen3","description":"The Qwen3 Embedding model series is the latest proprietary model of the Qwen family, specifically designed for text embedding and ranking tasks. Building upon the dense foundational models of the Qwen3 series, it provides a comprehensive range of text embeddings and reranking models in various sizes (0.6B, 4B, and 8B).","status":"active","model_type":"embed","open_weight":true,"license":"apache-2.0","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["embeddings"],"tagline":"The Qwen3 Embedding model series is the latest proprietary model of the Qwen family, specifically designed for text embedding and ranking tasks."},{"id":"Qwen/Qwen3-Embedding-4B","name":"Qwen3-Embedding-4B","created_by":"alibaba","source":"official","last_updated":"2026-04-26","family":"qwen3","description":"The Qwen3 Embedding model series is the latest proprietary model of the Qwen family, specifically designed for text embedding and ranking tasks. 
Building upon the dense foundational models of the Qwen3 series, it provides a comprehensive range of text embeddings and reranking models in various sizes (0.6B, 4B, and 8B).","status":"active","model_type":"embed","open_weight":true,"license":"apache-2.0","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["embeddings"],"tagline":"The Qwen3 Embedding model series is the latest proprietary model of the Qwen family, specifically designed for text embedding and ranking tasks."},{"id":"Qwen/Qwen3-Embedding-8B-batch","name":"Qwen3-Embedding-8B-batch","created_by":"alibaba","source":"official","last_updated":"2026-04-26","family":"qwen3","description":"The Qwen3 Embedding model series is the latest proprietary model of the Qwen family, specifically designed for text embedding and ranking tasks. Building upon the dense foundational models of the Qwen3 series, it provides a comprehensive range of text embeddings and reranking models in various sizes (0.6B, 4B, and 8B).","status":"active","model_type":"embed","open_weight":true,"license":"apache-2.0","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["embeddings"],"tagline":"The Qwen3 Embedding model series is the latest proprietary model of the Qwen family, specifically designed for text embedding and ranking tasks."},{"id":"Qwen/Qwen3-Embedding-8B","name":"Qwen3-Embedding-8B","created_by":"alibaba","source":"official","last_updated":"2026-04-26","family":"qwen3","description":"The Qwen3 Embedding model series is the latest proprietary model of the Qwen family, specifically designed for text embedding and ranking tasks. 
Building upon the dense foundational models of the Qwen3 series, it provides a comprehensive range of text embeddings and reranking models in various sizes (0.6B, 4B, and 8B).","status":"active","model_type":"embed","open_weight":true,"license":"apache-2.0","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["embeddings"],"tagline":"The Qwen3 Embedding model series is the latest proprietary model of the Qwen family, specifically designed for text embedding and ranking tasks."},{"id":"Qwen/Qwen3-Max-Thinking","name":"Qwen3-Max-Thinking","created_by":"alibaba","source":"official","last_updated":"2026-04-26","family":"qwen3","description":"The latest flagship reasoning model in the Qwen3 family. Further enhanced by multiple innovations like adaptive tool-use and advanced test-time scaling techniques","status":"active","model_type":"chat","context_window":256000,"open_weight":false,"license":"apache-2.0","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":1.2,"output":6,"cached_input":0.24},"tools":["function_calling"],"endpoints":["chat_completions"],"tagline":"The latest flagship reasoning model in the Qwen3 family."},{"id":"Qwen/Qwen3-Max","name":"Qwen3-Max","created_by":"alibaba","source":"official","last_updated":"2026-04-26","family":"qwen3","description":"The latest flagship model in the Qwen family. 
State-of-the-art results across a comprehensive suite of benchmarks — including knowledge, reasoning, coding, instruction following, human preference alignment, agent tasks, and multilingual understanding.","status":"active","model_type":"chat","context_window":256000,"open_weight":false,"license":"apache-2.0","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":1.2,"output":6,"cached_input":0.24},"tools":["function_calling"],"endpoints":["chat_completions"],"tagline":"The latest flagship model in the Qwen family."},{"id":"Qwen/Qwen3-Next-80B-A3B-Instruct","name":"Qwen3-Next-80B-A3B-Instruct","created_by":"alibaba","source":"official","last_updated":"2026-04-26","family":"qwen3","description":"Over the past few months, we have observed increasingly clear trends toward scaling both total parameters and context lengths in the pursuit of more powerful and agentic artificial intelligence (AI). We are excited to share our latest advancements in addressing these demands, centered on improving scaling efficiency through innovative model architecture. 
We call this next-generation foundation models Qwen3-Next.","status":"active","model_type":"chat","context_window":262144,"open_weight":true,"license":"apache-2.0","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.09,"output":1.1},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"fp8","tagline":"Over the past few months, we have observed increasingly clear trends toward scaling both total parameters and context lengths in the pursuit of more powerful and agentic artificial intelligence (AI)."},{"id":"Qwen/Qwen3-Reranker-0.6B","name":"Qwen3-Reranker-0.6B","created_by":"alibaba","source":"official","last_updated":"2026-04-26","family":"qwen3","description":"The Qwen3 Embedding model series is the latest proprietary model of the Qwen family, specifically designed for text embedding and ranking tasks. Building upon the dense foundational models of the Qwen3 series, it provides a comprehensive range of text embeddings and reranking models in various sizes (0.6B, 4B, and 8B)","status":"active","model_type":"rerank","open_weight":true,"license":"apache-2.0","modalities":{"input":["text"],"output":["text"]},"endpoints":["rerank"],"tagline":"The Qwen3 Embedding model series is the latest proprietary model of the Qwen family, specifically designed for text embedding and ranking tasks."},{"id":"Qwen/Qwen3-Reranker-4B","name":"Qwen3-Reranker-4B","created_by":"alibaba","source":"official","last_updated":"2026-04-26","family":"qwen3","description":"The Qwen3 Embedding model series is the latest proprietary model of the Qwen family, specifically designed for text embedding and ranking tasks. 
Building upon the dense foundational models of the Qwen3 series, it provides a comprehensive range of text embeddings and reranking models in various sizes (0.6B, 4B, and 8B)","status":"active","model_type":"rerank","open_weight":true,"license":"apache-2.0","modalities":{"input":["text"],"output":["text"]},"endpoints":["rerank"],"tagline":"The Qwen3 Embedding model series is the latest proprietary model of the Qwen family, specifically designed for text embedding and ranking tasks."},{"id":"Qwen/Qwen3-Reranker-8B","name":"Qwen3-Reranker-8B","created_by":"alibaba","source":"official","last_updated":"2026-04-26","family":"qwen3","description":"The Qwen3 Embedding model series is the latest proprietary model of the Qwen family, specifically designed for text embedding and ranking tasks. Building upon the dense foundational models of the Qwen3 series, it provides a comprehensive range of text embeddings and reranking models in various sizes (0.6B, 4B, and 8B)","status":"active","model_type":"rerank","open_weight":true,"license":"apache-2.0","modalities":{"input":["text"],"output":["text"]},"endpoints":["rerank"],"tagline":"The Qwen3 Embedding model series is the latest proprietary model of the Qwen family, specifically designed for text embedding and ranking tasks."},{"id":"Qwen/Qwen3-TTS-VoiceDesign","name":"Qwen3-TTS-VoiceDesign","created_by":"alibaba","source":"official","last_updated":"2026-04-26","family":"qwen3","description":"● Qwen3-TTS-VoiceDesign is a voice design variant of Qwen3-TTS by Alibaba's Qwen team. Instead of selecting from preset voices, you describe the voice you want in natural language — and the model generates speech in that voice. Key capabilities: - Natural language voice control — describe any voice with free text (e.g. 
\"a deep male voice with a calm, authoritative presence\", \"a young cheerful female with a warm and friendly tone\") - 10 languages — English, Chinese, Japanese, Korean, German, F...","status":"active","model_type":"tts","open_weight":true,"license":"apache-2.0","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["audio"]},"endpoints":["audio_speech"],"pricing_notes":["$20.0000 per 1M input characters"],"tagline":"● Qwen3-TTS-VoiceDesign is a voice design variant of Qwen3-TTS by Alibaba's Qwen team."},{"id":"Qwen/Qwen3-TTS","name":"Qwen3-TTS","created_by":"alibaba","source":"official","last_updated":"2026-04-26","family":"qwen3","description":"Qwen3-TTS is an advanced text-to-speech model by Alibaba's Qwen team, delivering stable, expressive, and low-latency speech generation across 10 languages. Key capabilities: - 9 preset voices — Vivian, Serena, Uncle_Fu, Dylan, Eric, Ryan, Aiden, Ono_Anna, Sohee — covering diverse genders, ages, and accents - Voice cloning — clone any voice from a short (~3s) audio sample via the voice_id parameter - Instruction control — adjust tone, emotion, and speaking style with natural language (e.g. \"sp...","status":"active","model_type":"tts","open_weight":true,"license":"apache-2.0","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["audio"]},"endpoints":["audio_speech"],"pricing_notes":["$20.0000 per 1M input characters"],"tagline":"Qwen3-TTS is an advanced text-to-speech model by Alibaba's Qwen team, delivering stable, expressive, and low-latency speech generation across 10 languages."},{"id":"Qwen/Qwen3-VL-235B-A22B-Instruct","name":"Qwen3-VL-235B-A22B-Instruct","created_by":"alibaba","source":"official","last_updated":"2026-04-26","family":"qwen3","description":"Meet Qwen3-VL — the most powerful vision-language model in the Qwen series to date. 
This generation delivers comprehensive upgrades across the board: superior text understanding & generation, deeper visual perception & reasoning, extended context length, enhanced spatial and video dynamics comprehension, and stronger agent interaction capabilities.","status":"active","model_type":"chat","context_window":262144,"open_weight":true,"license":"apache-2.0","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"vision":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":0.2,"output":0.88,"cached_input":0.11},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"fp8","tagline":"Meet Qwen3-VL — the most powerful vision-language model in the Qwen series to date."},{"id":"Qwen/Qwen3-VL-30B-A3B-Instruct","name":"Qwen3-VL-30B-A3B-Instruct","created_by":"alibaba","source":"official","last_updated":"2026-04-26","family":"qwen3","description":"Meet Qwen3-VL — the most powerful vision-language model in the Qwen series to date. 
This generation delivers comprehensive upgrades across the board: superior text understanding & generation, deeper visual perception & reasoning, extended context length, enhanced spatial and video dynamics comprehension, and stronger agent interaction capabilities.","status":"active","model_type":"chat","context_window":262144,"open_weight":true,"license":"apache-2.0","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"vision":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":0.15,"output":0.6},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"fp8","tagline":"Meet Qwen3-VL — the most powerful vision-language model in the Qwen series to date."},{"id":"Qwen/Qwen3.5-0.8B","name":"Qwen3.5-0.8B","created_by":"alibaba","source":"official","last_updated":"2026-06-03","family":"qwen3","description":"Qwen3.5-0.8B is Alibaba's smallest model in the Qwen3.5 series, featuring a hybrid Gated Delta Networks and sparse Mixture-of-Experts architecture. Despite its compact size, it supports a 262K token context window, 201 languages, thinking/reasoning mode, and tool calling. 
Ideal for edge deployments, resource-constrained environments, and lightweight inference tasks.","status":"active","model_type":"chat","context_window":262144,"reasoning_tokens":true,"open_weight":true,"license":"apache-2.0","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"reasoning":true,"vision":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":0.01,"output":0.05},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"bfloat16","tagline":"Qwen3.5-0.8B is Alibaba's smallest model in the Qwen3.5 series, featuring a hybrid Gated Delta Networks and sparse Mixture-of-Experts architecture."},{"id":"Qwen/Qwen3.5-122B-A10B","name":"Qwen3.5-122B-A10B","created_by":"alibaba","source":"official","last_updated":"2026-06-29","family":"qwen3","description":"Qwen3.5-122B-A10B is a large Mixture-of-Experts model from Alibaba's Qwen3.5 series with 122B total parameters and 10B activated per token. It features a 262K token context window (extensible to 1M with YaRN), thinking/reasoning mode, tool calling, and support for 201 languages. 
Excels at complex reasoning, coding, multimodal understanding, and agentic tasks with the efficiency of sparse activation.","status":"active","model_type":"chat","context_window":16384,"reasoning_tokens":true,"open_weight":true,"license":"apache-2.0","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"reasoning":true,"vision":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":0.29,"output":2.4,"cached_input":0.145},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"fp4","tagline":"Qwen3.5-122B-A10B is a large Mixture-of-Experts model from Alibaba's Qwen3.5 series with 122B total parameters and 10B activated per token."},{"id":"Qwen/Qwen3.5-27B","name":"Qwen3.5-27B","created_by":"alibaba","source":"official","last_updated":"2026-04-26","family":"qwen3","description":"Qwen3.5-27B is Alibaba's largest dense Qwen3.5 model, delivering near-frontier quality across reasoning, coding, and instruction following. It features a 262K token context window (extensible to 1M), thinking/reasoning mode, tool calling, multi-token prediction, and support for 201 languages. 
Best suited for production deployments and complex enterprise tasks requiring top-tier performance.","status":"active","model_type":"chat","context_window":262144,"reasoning_tokens":true,"open_weight":true,"license":"apache-2.0","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"reasoning":true,"vision":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":0.26,"output":2.6},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"fp8","tagline":"Qwen3.5-27B is Alibaba's largest dense Qwen3.5 model, delivering near-frontier quality across reasoning, coding, and instruction following."},{"id":"Qwen/Qwen3.5-2B","name":"Qwen3.5-2B","created_by":"alibaba","source":"official","last_updated":"2026-06-03","family":"qwen3","description":"Qwen3.5-2B is a compact yet capable model from Alibaba's Qwen3.5 series. It features a 262K token context window, support for 201 languages, thinking/reasoning mode, and tool calling for agentic workflows. A strong choice for prototyping, fine-tuning, and efficient multilingual deployments.","status":"active","model_type":"chat","context_window":262144,"reasoning_tokens":true,"open_weight":true,"license":"apache-2.0","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"reasoning":true,"vision":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":0.02,"output":0.1},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"bfloat16","tagline":"Qwen3.5-2B is a compact yet capable model from Alibaba's Qwen3.5 series."},{"id":"Qwen/Qwen3.5-35B-A3B","name":"Qwen3.5-35B-A3B","created_by":"alibaba","source":"official","last_updated":"2026-06-03","family":"qwen3","description":"Qwen3.5-35B-A3B is an efficient Mixture-of-Experts model from Alibaba's Qwen3.5 series with 35B total parameters and only 3B activated per token. 
It features a 262K token context window (extensible to 1M with YaRN), thinking/reasoning mode, tool calling, and support for 201 languages. Delivers strong performance on reasoning, coding, and vision-language tasks at a fraction of the compute cost.","status":"active","model_type":"chat","context_window":262144,"reasoning_tokens":true,"open_weight":true,"license":"apache-2.0","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"reasoning":true,"vision":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":0.14,"output":1,"cached_input":0.05},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"fp8","tagline":"Qwen3.5-35B-A3B is an efficient Mixture-of-Experts model from Alibaba's Qwen3.5 series with 35B total parameters and only 3B activated per token."},{"id":"Qwen/Qwen3.5-397B-A17B","name":"Qwen3.5-397B-A17B","created_by":"alibaba","source":"official","last_updated":"2026-06-10","family":"qwen3","description":"Qwen3.5-397B-A17B is Alibaba's most capable Qwen3.5 model, a Mixture-of-Experts architecture with 397B total parameters and 17B activated per token. It features a 262K token context window (extensible to 1M with YaRN), thinking/reasoning mode, tool calling with MCP integration, and support for 201 languages. 
Sets state-of-the-art results on reasoning, coding, math, and multimodal benchmarks.","status":"active","model_type":"chat","context_window":262144,"reasoning_tokens":true,"open_weight":true,"license":"apache-2.0","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"reasoning":true,"vision":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":0.45,"output":3,"cached_input":0.22},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"fp8","tagline":"Qwen3.5-397B-A17B is Alibaba's most capable Qwen3.5 model, a Mixture-of-Experts architecture with 397B total parameters and 17B activated per token."},{"id":"Qwen/Qwen3.5-4B","name":"Qwen3.5-4B","created_by":"alibaba","source":"official","last_updated":"2026-06-03","family":"qwen3","description":"Qwen3.5-4B is a mid-size model from Alibaba's Qwen3.5 series that delivers a strong balance of performance and efficiency. It features a 262K token context window (extensible to 1M with YaRN), thinking/reasoning mode, tool calling, and support for 201 languages. 
Well-suited for complex reasoning, code generation, and agentic applications.","status":"active","model_type":"chat","context_window":262144,"reasoning_tokens":true,"open_weight":true,"license":"apache-2.0","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"reasoning":true,"vision":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":0.03,"output":0.15},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"bfloat16","tagline":"Qwen3.5-4B is a mid-size model from Alibaba's Qwen3.5 series that delivers a strong balance of performance and efficiency."},{"id":"Qwen/Qwen3.5-9B","name":"Qwen3.5-9B","created_by":"alibaba","source":"official","description":"Qwen3.5-9B is a high-performance model from Alibaba's Qwen3.5 series with a hybrid Gated Delta Networks and sparse MoE architecture. It features a 262K token context window, thinking/reasoning mode, tool calling, multi-token prediction, and support for 201 languages. 
Excels at reasoning, coding, instruction following, and long-context tasks.","status":"active","context_window":262144,"model_type":"chat","license":"apache-2.0","open_weight":true,"tagline":"Qwen3.5-9B is a high-performance model from Alibaba's Qwen3.5 series with a hybrid Gated Delta Networks and sparse MoE architecture.","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"vision":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":0.1,"output":0.15},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"bfloat16","last_updated":"2026-06-10"},{"id":"Qwen/Qwen3.6-27B","name":"Qwen3.6-27B","created_by":"alibaba","source":"official","status":"active","context_window":262144,"model_type":"chat","reasoning_tokens":true,"license":"apache-2.0","open_weight":true,"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"reasoning":true,"vision":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":0.32,"output":3.2},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"fp8","last_updated":"2026-06-03"},{"id":"Qwen/Qwen3.6-35B-A3B","name":"Qwen3.6-35B-A3B","created_by":"alibaba","source":"official","last_updated":"2026-06-03","family":"qwen3","description":"Qwen3.6-35B-A3B is Alibaba's latest flagship Mixture-of-Experts model, with 35B total parameters and only 3B activated per token (256 experts, 8 routed + 1 shared). 
Built on direct feedback from the community, Qwen3.6 prioritizes stability and real-world utility, offering developers a more intuitive, responsive, and genuinely productive coding experience.","status":"active","model_type":"chat","context_window":262144,"reasoning_tokens":true,"open_weight":true,"license":"apache-2.0","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"reasoning":true,"vision":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":0.15,"output":0.95},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"fp8","tagline":"Qwen3.6-35B-A3B is Alibaba's latest flagship Mixture-of-Experts model, with 35B total parameters and only 3B activated per token (256 experts, 8 routed + 1 shared)."},{"id":"Qwen/Qwen3.7-Max","name":"Qwen3.7-Max","created_by":"alibaba","source":"official","description":"The largest and most capable in the Qwen3.7 series. Qwen3.7 is a next‑generation flagship model designed for the agent‑centric.","status":"active","context_window":256000,"model_type":"chat","license":"apache-2.0","open_weight":false,"tagline":"The largest and most capable in the Qwen3.7 series.","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":2.5,"output":7.5,"cached_input":0.5},"tools":["function_calling"],"endpoints":["chat_completions"],"last_updated":"2026-06-03"},{"id":"ResembleAI/chatterbox-multilingual","name":"chatterbox-multilingual","created_by":"resembleai","source":"official","last_updated":"2026-04-26","family":"resembleai","description":"09/04 🔥 Introducing Chatterbox Multilingual in 23 Languages! We're excited to introduce Chatterbox and Chatterbox Multilingual, Resemble AI's production-grade open source TTS models. 
Chatterbox Multilingual supports Arabic, Danish, German, Greek, English, Spanish, Finnish, French, Hebrew, Hindi, Italian, Japanese, Korean, Malay, Dutch, Norwegian, Polish, Portuguese, Russian, Swedish, Swahili, Turkish, Chinese out of the box. Licensed under MIT, Chatterbox has been benchmarked against leading...","status":"active","model_type":"tts","open_weight":true,"capabilities":{"streaming":true},"modalities":{"input":["text"],"output":["audio"]},"endpoints":["audio_speech"],"pricing_notes":["$1.0000 per 1M input characters"],"tagline":"09/04 🔥 Introducing Chatterbox Multilingual in 23 Languages! We're excited to introduce Chatterbox and Chatterbox Multilingual, Resemble AI's production-grade open source TTS models."},{"id":"ResembleAI/chatterbox-turbo","name":"chatterbox-turbo","created_by":"resembleai","source":"official","last_updated":"2026-04-26","family":"resembleai","description":"Chatterbox is a family of three state-of-the-art, open-source text-to-speech models by Resemble AI. We are excited to introduce Chatterbox-Turbo, our most efficient model yet. Built on a streamlined 350M parameter architecture, Turbo delivers high-quality speech with less compute and VRAM than our previous models. We have also distilled the speech-token-to-mel decoder, previously a bottleneck, reducing generation from 10 steps to just one, while retaining high-fidelity audio output. 
Paralingu...","status":"active","model_type":"tts","open_weight":true,"capabilities":{"streaming":true},"modalities":{"input":["text"],"output":["audio"]},"endpoints":["audio_speech"],"pricing_notes":["$1.0000 per 1M input characters"],"tagline":"Chatterbox is a family of three state-of-the-art, open-source text-to-speech models by Resemble AI."},{"id":"Sao10K/L3-8B-Lunaris-v1-Turbo","name":"L3-8B-Lunaris-v1-Turbo","created_by":"sao10k","source":"official","last_updated":"2026-04-26","family":"sao10k","status":"active","model_type":"chat","context_window":8192,"open_weight":true,"capabilities":{"structured_output":true,"json_mode":true,"streaming":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.04,"output":0.05},"endpoints":["chat_completions"],"quantization":"fp8"},{"id":"Sao10K/L3.1-70B-Euryale-v2.2","name":"L3.1-70B-Euryale-v2.2","created_by":"sao10k","source":"official","last_updated":"2026-04-26","family":"sao10k","description":"Euryale 3.1 - 70B v2.2 is a model focused on creative roleplay from Sao10k","status":"active","model_type":"chat","context_window":131072,"open_weight":true,"capabilities":{"structured_output":true,"json_mode":true,"streaming":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.85,"output":0.85},"endpoints":["chat_completions"],"quantization":"fp8","tagline":"Euryale 3.1 - 70B v2.2 is a model focused on creative roleplay from Sao10k"},{"id":"Sao10K/L3.3-70B-Euryale-v2.3","name":"L3.3-70B-Euryale-v2.3","created_by":"sao10k","source":"official","last_updated":"2026-04-26","family":"sao10k","description":"L3.3-70B-Euryale-v2.3 is a model focused on creative roleplay from 
Sao10k","status":"active","model_type":"chat","context_window":131072,"open_weight":true,"capabilities":{"structured_output":true,"json_mode":true,"streaming":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.85,"output":0.85},"endpoints":["chat_completions"],"quantization":"fp8","tagline":"L3.3-70B-Euryale-v2.3 is a model focused on creative roleplay from Sao10k"},{"id":"sentence-transformers/all-MiniLM-L12-v2","name":"all-MiniLM-L12-v2","created_by":"sentence-transformers","source":"official","last_updated":"2026-04-26","family":"sentence-transformers","description":"We present a sentence transformation model that generates semantically similar sentences. Our model is based on the Sentence-Transformers architecture and was trained on a large dataset of sentence pairs. We evaluate the effectiveness of our model by measuring its ability to generate similar sentences that are close to the original sentence in meaning.","status":"active","model_type":"embed","open_weight":true,"license":"apache-2.0","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["embeddings"],"tagline":"We present a sentence transformation model that generates semantically similar sentences."},{"id":"sentence-transformers/all-MiniLM-L6-v2","name":"all-MiniLM-L6-v2","created_by":"sentence-transformers","source":"official","last_updated":"2026-04-26","family":"sentence-transformers","description":"We present a sentence transformation model that achieves state-of-the-art results on various NLP tasks without requiring task-specific architectures or fine-tuning. Our approach leverages contrastive learning and utilizes a variety of datasets to learn robust sentence representations. 
We evaluate our model on several benchmarks and demonstrate its effectiveness in various applications such as text classification, sentiment analysis, named entity recognition, and question answering.","status":"active","model_type":"embed","open_weight":true,"license":"apache-2.0","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["embeddings"],"tagline":"We present a sentence transformation model that achieves state-of-the-art results on various NLP tasks without requiring task-specific architectures or fine-tuning."},{"id":"sentence-transformers/all-mpnet-base-v2","name":"all-mpnet-base-v2","created_by":"sentence-transformers","source":"official","last_updated":"2026-04-26","family":"sentence-transformers","description":"A sentence transformation model that has been trained on a wide range of datasets, including but not limited to S2ORC, WikiAnwers, PAQ, Stack Exchange, and Yahoo! Answers. Our model can be used for various NLP tasks such as clustering, sentiment analysis, and question answering.","status":"active","model_type":"embed","open_weight":true,"license":"apache-2.0","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["embeddings"],"tagline":"A sentence transformation model that has been trained on a wide range of datasets, including but not limited to S2ORC, WikiAnwers, PAQ, Stack Exchange, and Yahoo! Answers."},{"id":"sentence-transformers/clip-ViT-B-32-multilingual-v1","name":"clip-ViT-B-32-multilingual-v1","created_by":"sentence-transformers","source":"official","last_updated":"2026-04-26","family":"sentence-transformers","description":"This model is a multilingual version of the OpenAI CLIP-ViT-B32 model, which maps text and images to a common dense vector space. It includes a text embedding model that works for 50+ languages and an image encoder from CLIP. 
The model was trained using Multilingual Knowledge Distillation, where a multilingual DistilBERT model was trained as a student model to align the vector space of the original CLIP image encoder across many languages.","status":"active","model_type":"embed","open_weight":true,"license":"apache-2.0","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["embeddings"],"tagline":"This model is a multilingual version of the OpenAI CLIP-ViT-B32 model, which maps text and images to a common dense vector space."},{"id":"sentence-transformers/clip-ViT-B-32","name":"clip-ViT-B-32","created_by":"sentence-transformers","source":"official","last_updated":"2026-04-26","family":"sentence-transformers","description":"The CLIP model maps text and images to a shared vector space, enabling various applications such as image search, zero-shot image classification, and image clustering. The model can be used easily after installation, and its performance is demonstrated through zero-shot ImageNet validation set accuracy scores. Multilingual versions of the model are also available for 50+ languages.","status":"active","model_type":"embed","open_weight":true,"license":"apache-2.0","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["embeddings"],"tagline":"The CLIP model maps text and images to a shared vector space, enabling various applications such as image search, zero-shot image classification, and image clustering."},{"id":"sentence-transformers/multi-qa-mpnet-base-dot-v1","name":"multi-qa-mpnet-base-dot-v1","created_by":"sentence-transformers","source":"official","last_updated":"2026-04-26","family":"sentence-transformers","description":"We present a sentence transformation model that maps sentences and paragraphs to a 768-dimensional dense vector space, suitable for semantic search tasks. 
The model is trained on 215 million question-answer pairs from various sources, including WikiAnswers, PAQ, Stack Exchange, MS MARCO, GOOAQ, Amazon QA, Yahoo Answers, Search QA, ELI5, and Natural Questions. Our model uses a contrastive learning objective.","status":"active","model_type":"embed","open_weight":true,"license":"apache-2.0","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["embeddings"],"tagline":"We present a sentence transformation model that maps sentences and paragraphs to a 768-dimensional dense vector space, suitable for semantic search tasks."},{"id":"sentence-transformers/paraphrase-MiniLM-L6-v2","name":"paraphrase-MiniLM-L6-v2","created_by":"sentence-transformers","source":"official","last_updated":"2026-04-26","family":"sentence-transformers","description":"We present a sentence similarity model based on the Sentence Transformers architecture, which maps sentences to a 384-dimensional dense vector space. The model uses a pre-trained BERT encoder and applies mean pooling on top of the contextualized word embeddings to obtain sentence embeddings. We evaluate the model on the Sentence Embeddings Benchmark.","status":"active","model_type":"embed","open_weight":true,"license":"apache-2.0","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["embeddings"],"tagline":"We present a sentence similarity model based on the Sentence Transformers architecture, which maps sentences to a 384-dimensional dense vector space."},{"id":"sesame/csm-1b","name":"csm-1b","created_by":"sesame","source":"official","last_updated":"2026-04-26","family":"sesame","description":"CSM (Conversational Speech Model) is a speech generation model from Sesame that generates RVQ audio codes from text and audio inputs. 
The model architecture employs a Llama backbone and a smaller audio decoder that produces Mimi audio codes.","status":"active","model_type":"tts","open_weight":true,"capabilities":{"streaming":true},"modalities":{"input":["text"],"output":["audio"]},"endpoints":["audio_speech"],"pricing_notes":["$7.0000 per 1M input characters"],"tagline":"CSM (Conversational Speech Model) is a speech generation model from Sesame that generates RVQ audio codes from text and audio inputs."},{"id":"shibing624/text2vec-base-chinese","name":"text2vec-base-chinese","created_by":"shibing624","source":"official","last_updated":"2026-04-26","family":"shibing624","description":"A sentence similarity model that can be used for various NLP tasks such as text classification, sentiment analysis, named entity recognition, question answering, and more. It utilizes the CoSENT architecture, which consists of a transformer encoder and a pooling module, to encode input texts into vectors that capture their semantic meaning. The model was trained on the nli_zh dataset and achieved high performance on various benchmark datasets.","status":"active","model_type":"embed","open_weight":true,"capabilities":{"streaming":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["embeddings"],"tagline":"A sentence similarity model that can be used for various NLP tasks such as text classification, sentiment analysis, named entity recognition, question answering, and more."},{"id":"stabilityai/sdxl-turbo","name":"sdxl-turbo","created_by":"stability-ai","source":"official","last_updated":"2026-04-26","family":"sdxl","description":"The SDXL Turbo model, developed by Stability AI, is an optimized, fast text-to-image generative model. 
It is a distilled version of SDXL 1.0, leveraging Adversarial Diffusion Distillation (ADD) to generate high-quality images in less steps.","status":"active","model_type":"image","open_weight":true,"license":"stability-ai","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"pricing_notes":["$0.0002 per image unit (1024x1024 default)"],"tagline":"The SDXL Turbo model, developed by Stability AI, is an optimized, fast text-to-image generative model."},{"id":"stepfun-ai/Step-3.5-Flash","name":"Step-3.5-Flash","created_by":"stepfun","source":"official","last_updated":"2026-06-03","family":"step-3","description":"Step 3.5 Flash is an open-source reasoning model by StepFun with 196B total parameters (11B active) using Mixture of Experts. It features a 256K context window, deep reasoning, tool calling, and agentic capabilities, achieving 97.3 on AIME 2025 and 74.4% on SWE-bench Verified.","status":"active","model_type":"chat","context_window":262144,"open_weight":true,"license":"apache-2.0","capabilities":{"tool_call":true,"streaming":true,"fine_tuning":true,"reasoning":true,"structured_output":true,"json_mode":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.09,"output":0.3,"cached_input":0.02},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"fp8","tagline":"Step 3.5 Flash is an open-source reasoning model by StepFun with 196B total parameters (11B active) using Mixture of Experts."},{"id":"stepfun-ai/Step-3.7-Flash","name":"Step-3.7-Flash","created_by":"stepfun","source":"official","description":"Step 3.7 Flash is an open-source multimodal reasoning model by StepFun with 198B total parameters (11B active) using Mixture of Experts. 
It accepts text and image inputs and features a 256K context window, selectable reasoning effort, tool calling, and agentic capabilities for coding and search workflows, scoring 80.9% on GPQA Diamond and 56.3% on SWE-bench Pro.","status":"active","context_window":262144,"model_type":"chat","license":"apache-2.0","open_weight":true,"tagline":"Step 3.7 Flash is an open-source multimodal reasoning model by StepFun with 198B total parameters (11B active) using Mixture of Experts.","capabilities":{"tool_call":true,"vision":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":0.2,"output":1.15,"cached_input":0.04},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"modelopt","last_updated":"2026-06-18"},{"id":"thenlper/gte-base","name":"gte-base","created_by":"thenlper","source":"official","last_updated":"2026-04-26","family":"thenlper","description":"The GTE models are trained by Alibaba DAMO Academy. They are mainly based on the BERT framework and currently offer three different sizes of models, including GTE-large, GTE-base, and GTE-small. The GTE models are trained on a large-scale corpus of relevance text pairs, covering a wide range of domains and scenarios. This enables the GTE models to be applied to various downstream tasks of text embeddings, including information retrieval, semantic textual similarity, text reranking, etc.","status":"active","model_type":"embed","open_weight":true,"capabilities":{"streaming":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["embeddings"],"tagline":"The GTE models are trained by Alibaba DAMO Academy."},{"id":"thenlper/gte-large","name":"gte-large","created_by":"thenlper","source":"official","last_updated":"2026-04-26","family":"thenlper","description":"The GTE models are trained by Alibaba DAMO Academy. 
They are mainly based on the BERT framework and currently offer three different sizes of models, including GTE-large, GTE-base, and GTE-small. The GTE models are trained on a large-scale corpus of relevance text pairs, covering a wide range of domains and scenarios. This enables the GTE models to be applied to various downstream tasks of text embeddings, including information retrieval, semantic textual similarity, text reranking, etc.","status":"active","model_type":"embed","open_weight":true,"capabilities":{"streaming":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["embeddings"],"tagline":"The GTE models are trained by Alibaba DAMO Academy."},{"id":"Wan-AI/Wan2.2-T2V-A14B","name":"Wan2.2-T2V-A14B","created_by":"wan-ai","source":"official","last_updated":"2026-04-26","family":"Wan2.2","description":"The Wan2.2 T2V A14B is a next-generation 14B-parameter video foundation model by Wan-AI featuring a novel two-stage denoising architecture. It produces 480P videos with improved visual coherence and detail, generating 2 or 5 second clips at 16fps from text prompts.","status":"active","model_type":"video","open_weight":true,"modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"tagline":"The Wan2.2 T2V A14B is a next-generation 14B-parameter video foundation model by Wan-AI featuring a novel two-stage denoising architecture."},{"id":"Wan-AI/Wan2.6-I2V","name":"Wan2.6-I2V","created_by":"wan-ai","source":"official","last_updated":"2026-04-26","family":"Wan2.6","description":"Turn any image into a video. 
Intelligent shot scheduling supports multi-shot storytelling, generating multi-shot narrative videos with consistent subjects, scenes, and atmosphere","status":"active","model_type":"video","open_weight":false,"modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"pricing_notes":["$0.10 / second"],"tagline":"Turn any image into a video."},{"id":"Wan-AI/Wan2.6-Image-Edit","name":"Wan2.6-Image-Edit","created_by":"wan-ai","source":"official","last_updated":"2026-04-26","family":"Wan2.6","description":"An all-round image generation model that supports joint text–image reasoning, multi-image creative fusion, commercial-grade consistency, aesthetic style transfer, and precise control of framing and lighting, significantly enhancing consistency, controllability, and expressiveness in image generation.","status":"active","model_type":"image","open_weight":false,"capabilities":{"streaming":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"pricing_notes":["$0.0300 per image unit (0x0 default)"],"tagline":"An all-round image generation model that supports joint text–image reasoning, multi-image creative fusion, commercial-grade consistency, aesthetic style transfer, and precise control of framing and li"},{"id":"Wan-AI/Wan2.6-T2I","name":"Wan2.6-T2I","created_by":"wan-ai","source":"official","last_updated":"2026-04-26","family":"Wan2.6","description":"Wan2.6 text to image, Upgraded visual quality, aesthetics, and instruction-following deliver precise style control, realistic portraits, long-text understanding, and broad historical/cultural IP coverage, enabling high-quality, highly expressive visual generation.","status":"active","model_type":"image","open_weight":false,"capabilities":{"streaming":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"pricing_notes":["$0.0300 per image unit (0x0 default)"],"tagline":"Wan2.6 text to image, Upgraded visual quality, aesthetics, and instruction-following 
deliver precise style control, realistic portraits, long-text understanding, and broad historical/cultural IP cover"},{"id":"Wan-AI/Wan2.6-T2V","name":"Wan2.6-T2V","created_by":"wan-ai","source":"official","last_updated":"2026-04-26","family":"Wan2.6","description":"Turn any prompt into a smooth video. Intelligent shot scheduling supports multi-shot storytelling, generating multi-shot narrative videos with consistent subjects, scenes, and atmosphere","status":"active","model_type":"video","open_weight":false,"modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"pricing_notes":["$0.10 / second"],"tagline":"Turn any prompt into a smooth video."},{"id":"Wan-AI/Wan2.7-I2V","name":"Wan2.7-I2V","created_by":"wan-ai","source":"official","family":"Wan2.7","description":"Generates video content from images while stably preserving details such as subject, style, and text elements. Ensures visual consistency and information fidelity throughout dynamic transitions.","status":"active","model_type":"video","open_weight":false,"tagline":"Generates video content from images while stably preserving details such as subject, style, and text elements.","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"pricing_notes":["$0.10 / second"],"last_updated":"2026-06-03"},{"id":"Wan-AI/Wan2.7-Image-Edit","name":"Wan2.7-Image-Edit","created_by":"wan-ai","source":"official","last_updated":"2026-04-26","family":"Wan2.7","description":"Bleeding edge image model supporting generation and editing, text to image, text/image to sequential images, image editing, multi-image reference generation, and interactive editing. 
Delivers enhanced performance in text rendering, subject consistency, and complex instruction following","status":"active","model_type":"image","open_weight":false,"capabilities":{"streaming":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"pricing_notes":["$0.0300 per image unit (0x0 default)"],"tagline":"Bleeding edge image model supporting generation and editing, text to image, text/image to sequential images, image editing, multi-image reference generation, and interactive editing."},{"id":"Wan-AI/Wan2.7-R2V","name":"Wan2.7-R2V","created_by":"wan-ai","source":"official","family":"Wan2.7","description":"Accurately preserve the look and voice of people or objects from a reference video, supporting multi-reference co-creation.","status":"active","model_type":"video","open_weight":false,"tagline":"Accurately preserve the look and voice of people or objects from a reference video, supporting multi-reference co-creation.","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"pricing_notes":["$0.10 / second"],"last_updated":"2026-06-03"},{"id":"XiaomiMiMo/MiMo-V2.5-Pro","name":"MiMo-V2.5-Pro","created_by":"xiaomimimo","source":"official","family":"mimo","description":"MiMo-V2.5-Pro is an open-source Mixture-of-Experts (MoE) language model with 1.02T total parameters and 42B active parameters. 
It utilizes the hybrid attention architecture and 3-layers Multi-Token Prediction (MTP) introduced in [MiMo-V2-Flash](https://github.com/XiaomiMiMo/MiMo-V2-Flash).","status":"active","context_window":1048576,"model_type":"chat","reasoning_tokens":true,"open_weight":true,"tagline":"MiMo-V2.5-Pro is an open-source Mixture-of-Experts (MoE) language model with 1.02T total parameters and 42B active parameters.","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"reasoning":true,"streaming":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":1,"output":3,"cached_input":0.2},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"fp8","last_updated":"2026-06-03"},{"id":"XiaomiMiMo/MiMo-V2.5-tts-voiceclone","name":"MiMo-V2.5-tts-voiceclone","created_by":"xiaomimimo","source":"official","family":"mimo","description":"Automatically convert input text into natural and fluent speech output. You can generate natural and vivid speech content by configuring parameters such as speech. Precisely replicate voices from audio samples to enable speech synthesis of any voice. style and voice.","status":"active","model_type":"tts","open_weight":false,"tagline":"Automatically convert input text into natural and fluent speech output.","capabilities":{"streaming":true},"modalities":{"input":["text"],"output":["audio"]},"endpoints":["audio_speech"],"pricing_notes":["$0.0000 per 1M input characters"],"last_updated":"2026-06-03"},{"id":"XiaomiMiMo/MiMo-V2.5-tts-voicedesign","name":"MiMo-V2.5-tts-voicedesign","created_by":"xiaomimimo","source":"official","family":"mimo","description":"Automatically convert input text into natural and fluent speech output. You can generate natural and vivid speech content by configuring parameters such as speech style and voice. 
Automatically generate voices from text descriptions, without requiring presets or audio samples.","status":"active","model_type":"tts","open_weight":false,"tagline":"Automatically convert input text into natural and fluent speech output.","capabilities":{"streaming":true},"modalities":{"input":["text"],"output":["audio"]},"endpoints":["audio_speech"],"pricing_notes":["$0.0000 per 1M input characters"],"last_updated":"2026-06-03"},{"id":"XiaomiMiMo/MiMo-V2.5-tts","name":"MiMo-V2.5-tts","created_by":"xiaomimimo","source":"official","family":"mimo","description":"Automatically convert input text into natural and fluent speech output. You can generate natural and vivid speech content by configuring parameters such as speech style and voice. Use the high-quality voices from the built-in voices list.","status":"active","model_type":"tts","open_weight":false,"tagline":"Automatically convert input text into natural and fluent speech output.","capabilities":{"streaming":true},"modalities":{"input":["text"],"output":["audio"]},"endpoints":["audio_speech"],"pricing_notes":["$0.0000 per 1M input characters"],"last_updated":"2026-06-03"},{"id":"XiaomiMiMo/MiMo-V2.5","name":"MiMo-V2.5","created_by":"xiaomimimo","source":"official","family":"mimo","description":"MiMo-V2.5 is a native omnimodal model with strong agentic capabilities, supporting text, image, video, and audio understanding within a unified architecture. 
Built upon the MiMo-V2-Flash backbone and extended with dedicated vision and audio encoders, it delivers robust performance across multimodal perception, long-context reasoning, and agentic workflows.","status":"active","context_window":262144,"model_type":"chat","reasoning_tokens":true,"open_weight":true,"tagline":"MiMo-V2.5 is a native omnimodal model with strong agentic capabilities, supporting text, image, video, and audio understanding within a unified architecture.","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"reasoning":true,"vision":true,"streaming":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":0.4,"output":2,"cached_input":0.08},"tools":["function_calling"],"endpoints":["chat_completions"],"last_updated":"2026-06-03"},{"id":"zai-org/GLM-4.6","name":"GLM-4.6","created_by":"zhipu","source":"official","last_updated":"2026-04-26","family":"GLM-4.6","description":"Compared with GLM-4.5, GLM-4.6 brings several key improvements: Longer context window: The context window has been expanded from 128K to 200K tokens, enabling the model to handle more complex agentic tasks. Superior coding performance: The model achieves higher scores on code benchmarks and demonstrates better real-world performance in applications such as Claude Code、Cline、Roo Code and Kilo Code, including improvements in generating visually polished front-end pages. 
Advanced reasoning: GLM-...","status":"active","model_type":"chat","context_window":202752,"reasoning_tokens":true,"open_weight":true,"license":"mit","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"reasoning":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.43,"output":1.74,"cached_input":0.08},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"fp4","tagline":"Compared with GLM-4.5, GLM-4.6 brings several key improvements: Longer context window: The context window has been expanded from 128K to 200K tokens, enabling the model to handle more complex agentic tasks."},{"id":"zai-org/GLM-4.7-Flash","name":"GLM-4.7-Flash","created_by":"zhipu","source":"official","last_updated":"2026-04-26","family":"GLM-4.7","description":"GLM-4.7-Flash is a 30B-A3B MoE model. As the strongest model in the 30B class, GLM-4.7-Flash offers a new option for lightweight deployment that balances performance and efficiency.","status":"active","model_type":"chat","context_window":202752,"reasoning_tokens":true,"open_weight":true,"license":"mit","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"reasoning":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.06,"output":0.4,"cached_input":0.01},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"bfloat16","tagline":"GLM-4.7-Flash is a 30B-A3B MoE model."},{"id":"zai-org/GLM-4.7","name":"GLM-4.7","created_by":"zhipu","source":"official","last_updated":"2026-04-26","family":"GLM-4.7","description":"GLM-4.7 is a state-of-the-art, multilingual Mixture-of-Experts (MoE) language model designed for complex reasoning, agentic coding, and tool use. 
Building on its predecessor GLM-4.6, it delivers significant improvements across key benchmarks, including multilingual SWE-bench, Terminal Bench, and reasoning-heavy evaluations like HLE. The model features advanced \"Interleaved Thinking\" and new \"Preserved Thinking\" modes, allowing it to reason before actions and maintain consistency across long, ...","status":"active","model_type":"chat","context_window":202752,"reasoning_tokens":true,"open_weight":true,"license":"mit","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"reasoning":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.4,"output":1.75,"cached_input":0.08},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"fp4","tagline":"GLM-4.7 is a state-of-the-art, multilingual Mixture-of-Experts (MoE) language model designed for complex reasoning, agentic coding, and tool use."},{"id":"zai-org/GLM-5.1","name":"GLM-5.1","created_by":"zhipu","source":"official","last_updated":"2026-04-26","family":"GLM-5.1","description":"GLM-5.1 is Z-AI's next-generation flagship model for agentic engineering, with significantly stronger coding capabilities than its predecessor. 
It achieves state-of-the-art performance on SWE-Bench Pro and leads GLM-5 by a wide margin on NL2Repo (repo generation) and Terminal-Bench 2.0 (real-world terminal tasks).","status":"active","model_type":"chat","context_window":202752,"reasoning_tokens":true,"open_weight":true,"license":"mit","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"reasoning":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":1.05,"output":3.5,"cached_input":0.205},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"fp4","tagline":"GLM-5.1 is Z-AI's next-generation flagship model for agentic engineering, with significantly stronger coding capabilities than its predecessor."},{"id":"zai-org/GLM-5.2","name":"GLM-5.2","created_by":"zhipu","source":"official","family":"GLM-5.2","description":"GLM-5.2 is Z-AI's latest flagship model for long-horizon tasks. It marks a substantial leap in long-horizon task capability over its predecessor GLM-5.1 and, for the first time, delivers that capability on a **solid 1M-token context**.","status":"active","context_window":1048576,"model_type":"chat","reasoning_tokens":true,"license":"mit","open_weight":true,"tagline":"GLM-5.2 is Z-AI's latest flagship model for long-horizon tasks.","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"reasoning":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.95,"output":3,"cached_input":0.18},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"fp4","last_updated":"2026-06-29"},{"id":"zai-org/GLM-5","name":"GLM-5","created_by":"zhipu","source":"official","last_updated":"2026-04-26","family":"GLM-5","description":"GLM-5 is an advanced, open-source large language model designed for developers tackling the toughest challenges. 
It excels at long-context reasoning, multi-step tool orchestration, and complex systems engineering, making it the ideal choice for powering sophisticated agents and applications that require high-level cognitive tasks.","status":"active","model_type":"chat","context_window":202752,"reasoning_tokens":true,"open_weight":true,"license":"mit","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"reasoning":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.6,"output":2.08,"cached_input":0.12},"tools":["function_calling"],"endpoints":["chat_completions"],"quantization":"fp4","tagline":"GLM-5 is an advanced, open-source large language model designed for developers tackling the toughest challenges."},{"id":"Zyphra/Zonos-v0.1-hybrid","name":"Zonos-v0.1-hybrid","created_by":"zyphra","source":"official","last_updated":"2026-04-26","family":"zyphra","description":"Zonos-v0.1 is a leading open-weight text-to-speech model trained on more than 200k hours of varied multilingual speech, delivering expressiveness and quality on par with—or even surpassing—top TTS providers. Our model enables highly natural speech generation from text prompts when given a speaker embedding or audio prefix, and can accurately perform speech cloning when given a reference clip spanning just a few seconds. 
The conditioning setup also allows for fine control over speaking rate, p...","status":"active","model_type":"tts","open_weight":true,"capabilities":{"streaming":true},"modalities":{"input":["text"],"output":["audio"]},"endpoints":["audio_speech"],"pricing_notes":["$7.0000 per 1M input characters"],"tagline":"Zonos-v0.1 is a leading open-weight text-to-speech model trained on more than 200k hours of varied multilingual speech, delivering expressiveness and quality on par with—or even surpassing—top TTS providers."},{"id":"Zyphra/Zonos-v0.1-transformer","name":"Zonos-v0.1-transformer","created_by":"zyphra","source":"official","last_updated":"2026-04-26","family":"zyphra","description":"Zonos-v0.1 is a leading open-weight text-to-speech model trained on more than 200k hours of varied multilingual speech, delivering expressiveness and quality on par with—or even surpassing—top TTS providers. Our model enables highly natural speech generation from text prompts when given a speaker embedding or audio prefix, and can accurately perform speech cloning when given a reference clip spanning just a few seconds. 
The conditioning setup also allows for fine control over speaking rate, p...","status":"active","model_type":"tts","open_weight":true,"capabilities":{"streaming":true},"modalities":{"input":["text"],"output":["audio"]},"endpoints":["audio_speech"],"pricing_notes":["$7.0000 per 1M input characters"],"tagline":"Zonos-v0.1 is a leading open-weight text-to-speech model trained on more than 200k hours of varied multilingual speech, delivering expressiveness and quality on par with—or even surpassing—top TTS providers."}]}; export const models: Model[] = provider.models.map((m) => ({ ...m, provider: provider.id })); diff --git a/packages/npm/src/providers/fal.ts b/packages/npm/src/providers/fal.ts index f30277fae..d9d9c8d7f 100644 --- a/packages/npm/src/providers/fal.ts +++ b/packages/npm/src/providers/fal.ts @@ -3,6 +3,6 @@ import type { ProviderWithModels, Model } from '../types'; -export const provider: ProviderWithModels = {"id":"fal","name":"fal","region":"US","url":"https://fal.ai","api_url":"https://fal.run","docs_url":"https://fal.ai/docs","pricing_url":"https://fal.ai/pricing","description":"Generative media inference platform for image, video, audio, and multimodal model APIs.","type":"cloud","models_url":"https://api.fal.ai/v1/models","openai_compatible":false,"free_tier":false,"github_url":"https://github.com/fal-ai","twitter_url":"https://x.com/fal","icon":"\n \n","models":[{"id":"alibaba/happy-horse/image-to-video","name":"Happy Horse","created_by":"alibaba","source":"official","description":"Alibaba's #1-ranked Happy Horse 1.0 — generate 1080p video with synchronized native audio and multilingual lip-sync from text prompts or images.","status":"active","release_date":"2026-04-24","model_type":"video","page_url":"https://fal.run/alibaba/happy-horse/image-to-video","tagline":"Alibaba's #1-ranked Happy Horse 1.0 — generate 1080p video with synchronized native audio and multilingual lip-sync from text prompts or 
images.","capabilities":{"vision":true},"modalities":{"input":["text","image","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-28","last_updated":"2026-05-11"},{"id":"alibaba/happy-horse/reference-to-video","name":"Happy Horse","created_by":"alibaba","source":"official","description":"Generate 1080p video with synchronized native audio from a text prompt and references.","status":"active","release_date":"2026-04-27","model_type":"video","page_url":"https://fal.run/alibaba/happy-horse/reference-to-video","tagline":"Generate 1080p video with synchronized native audio from a text prompt and references.","capabilities":{"vision":true},"modalities":{"input":["text","image","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-28","last_updated":"2026-05-11"},{"id":"alibaba/happy-horse/text-to-video","name":"Happy Horse","created_by":"alibaba","source":"official","description":"Generate 1080p video with synchronized native audio from a text prompt.","status":"active","release_date":"2026-04-24","model_type":"video","page_url":"https://fal.run/alibaba/happy-horse/text-to-video","tagline":"Generate 1080p video with synchronized native audio from a text prompt.","modalities":{"input":["text","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-28","last_updated":"2026-05-11"},{"id":"alibaba/happy-horse/v1.1/image-to-video","name":"Happy Horse 1.1 Image to Video","created_by":"alibaba","source":"official","description":"Happy Horse 1.1 is Alibaba's #1-ranked video model.","status":"active","release_date":"2026-06-21","model_type":"video","page_url":"https://fal.run/alibaba/happy-horse/v1.1/image-to-video","tagline":"Happy Horse 1.1 is Alibaba's #1-ranked video model.","capabilities":{"vision":true},"modalities":{"input":["text","image","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"alibaba/happy-horse/v1.1/reference-to-video","name":"Happy 
Horse 1.1 Reference to Video","created_by":"alibaba","source":"official","description":"Happy Horse 1.1 is Alibaba's #1-ranked video model.","status":"active","release_date":"2026-06-21","model_type":"video","page_url":"https://fal.run/alibaba/happy-horse/v1.1/reference-to-video","tagline":"Happy Horse 1.1 is Alibaba's #1-ranked video model.","capabilities":{"vision":true},"modalities":{"input":["text","image","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"alibaba/happy-horse/v1.1/text-to-video","name":"Happy Horse 1.1 Text to Video","created_by":"alibaba","source":"official","description":"Happy Horse 1.1 is Alibaba's #1-ranked video model.","status":"active","release_date":"2026-06-21","model_type":"video","page_url":"https://fal.run/alibaba/happy-horse/v1.1/text-to-video","tagline":"Happy Horse 1.1 is Alibaba's #1-ranked video model.","modalities":{"input":["text","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"alibaba/happy-horse/video-edit","name":"Happy Horse Video Edit","created_by":"alibaba","source":"official","description":"HappyHorse video editing supports advanced video editing through natural language instructions.","status":"active","release_date":"2026-04-27","model_type":"other","page_url":"https://fal.run/alibaba/happy-horse/video-edit","tagline":"HappyHorse video editing supports advanced video editing through natural language instructions.","capabilities":{"vision":true},"last_seen_at":"2026-04-28","last_updated":"2026-05-11"},{"id":"argil/avatars/audio-to-video","name":"Avatars Audio to Video","created_by":"argil","source":"official","description":"High-quality avatar videos that feel real, generated from your audio","status":"active","release_date":"2025-09-01","model_type":"other","page_url":"https://fal.run/argil/avatars/audio-to-video","tagline":"High-quality avatar videos that feel real, generated from your 
audio","last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"argil/avatars/text-to-video","name":"Avatars Text to Video","created_by":"argil","source":"official","description":"High-quality avatar videos that feel real, generated from your text","status":"active","release_date":"2025-09-01","model_type":"video","page_url":"https://fal.run/argil/avatars/text-to-video","tagline":"High-quality avatar videos that feel real, generated from your text","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"async/tts-pro/v1.0","name":"Async Text to Speech Pro V1.0","created_by":"async","source":"official","family":"tts","description":"Generate professional-quality voiceovers in seconds with Async TTS Pro model text-based control over pauses, emphasis, and timing.","status":"active","release_date":"2026-06-18","model_type":"tts","page_url":"https://fal.run/async/tts-pro/v1.0","tagline":"Generate professional-quality voiceovers in seconds with Async TTS Pro model text-based control over pauses, emphasis, and timing.","modalities":{"input":["text"],"output":["audio"]},"endpoints":["audio_speech"],"last_seen_at":"2026-06-18","last_updated":"2026-06-20"},{"id":"bria/bria_video_eraser/erase/keypoints","name":"Bria Video Eraser","created_by":"bria","source":"official","description":"A high-fidelity capability for erasing unwanted objects, people, or visual elements from videos while maintaining aesthetic quality and temporal consistency.","status":"active","release_date":"2025-12-17","model_type":"other","page_url":"https://fal.run/bria/bria_video_eraser/erase/keypoints","tagline":"A high-fidelity capability for erasing unwanted objects, people, or visual elements from videos while maintaining aesthetic quality and temporal consistency.","last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"bria/bria_video_eraser/erase/mask","name":"Bria Video Eraser Erase 
Mask","created_by":"bria","source":"official","description":"A high-fidelity capability for erasing unwanted objects, people, or visual elements from videos while maintaining aesthetic quality and temporal consistency.","status":"active","release_date":"2025-12-17","model_type":"other","page_url":"https://fal.run/bria/bria_video_eraser/erase/mask","tagline":"A high-fidelity capability for erasing unwanted objects, people, or visual elements from videos while maintaining aesthetic quality and temporal consistency.","last_seen_at":"2026-01-26","last_updated":"2026-06-03"},{"id":"bria/bria_video_eraser/erase/prompt","name":"Bria Video Eraser","created_by":"bria","source":"official","description":"A high-fidelity capability for erasing unwanted objects, people, or visual elements from videos while maintaining aesthetic quality and temporal consistency","status":"active","release_date":"2025-12-17","model_type":"other","page_url":"https://fal.run/bria/bria_video_eraser/erase/prompt","tagline":"A high-fidelity capability for erasing unwanted objects, people, or visual elements from videos while maintaining aesthetic quality and temporal consistency","last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"bria/embed-product","name":"Embed Product","created_by":"bria","source":"official","family":"embed","description":"Seamlessly embed products into any scene with pixel-perfect control, automatic perspective, and natural lighting.","status":"active","release_date":"2026-02-25","model_type":"image","page_url":"https://fal.run/bria/embed-product","tagline":"Seamlessly integrate one or more products into a predefined scene with pixel-perfect control.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-05-20","last_updated":"2026-06-03"},{"id":"bria/fibo-bbq-preview/generate","name":"Fibo Bbq Preview","created_by":"bria","source":"official","description":"A preview to the next level of 
control of Text-to-Image models.","status":"active","release_date":"2026-03-02","model_type":"image","page_url":"https://fal.run/bria/fibo-bbq-preview/generate","tagline":"A preview to the next level of control of Text-to-Image models.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-03-02","last_updated":"2026-05-11"},{"id":"bria/fibo-edit/add_object_by_text","name":"Fibo Edit [Add Object by Text]","created_by":"bria","source":"official","description":"Precisely insert new objects into images with structured spatial commands.","status":"active","release_date":"2026-01-20","model_type":"image","page_url":"https://fal.run/bria/fibo-edit/add_object_by_text","tagline":"Precise, context-aware insertion of new objects into an existing image using simple, structured spatial commands.","capabilities":{"vision":true,"structured_output":true,"json_mode":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-05-20","last_updated":"2026-06-03"},{"id":"bria/fibo-edit/blend","name":"Fibo Edit [Blend]","created_by":"bria","source":"official","description":"image composition model.","status":"active","release_date":"2026-01-20","model_type":"image","page_url":"https://fal.run/bria/fibo-edit/blend","tagline":"Complex, multi-step visual composition through natural language.","capabilities":{"vision":true,"structured_output":true,"json_mode":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-05-20","last_updated":"2026-06-03"},{"id":"bria/fibo-edit/colorize","name":"Fibo Edit [Colorize]","created_by":"bria","source":"official","description":"Image colorization and color-grading model.","status":"active","release_date":"2026-01-20","model_type":"image","page_url":"https://fal.run/bria/fibo-edit/colorize","tagline":"Transforms the color treatment of images using predefined, style-based 
commands","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-05-20","last_updated":"2026-06-03"},{"id":"bria/fibo-edit/edit/structured_instruction","name":"Fibo Edit [Structured Instruction]","created_by":"bria","source":"official","description":"Structured Instructions Generation endpoint for Fibo Edit, Bria's newest editing model.","status":"active","release_date":"2026-01-20","model_type":"other","page_url":"https://fal.run/bria/fibo-edit/edit/structured_instruction","tagline":"Structured Instructions Generation endpoint for Fibo Edit, Bria's newest editing model.","capabilities":{"structured_output":true,"json_mode":true},"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"bria/fibo-edit/edit","name":"Fibo Edit","created_by":"bria","source":"official","description":"High-fidelity image editing model with state-of-the-art controllability.","status":"active","release_date":"2026-01-20","model_type":"image","page_url":"https://fal.run/bria/fibo-edit/edit","tagline":"A high-quality editing model that achieves maximum controllability and transparency by combining JSON + Mask + Image.","capabilities":{"vision":true,"structured_output":true,"json_mode":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-05-20","last_updated":"2026-06-03"},{"id":"bria/fibo-edit/erase_by_text","name":"Fibo Edit [Erase by Text]","created_by":"bria","source":"official","description":"Remove unwanted objects from images with a text prompt - fast, precise editing that seamlessly blends results.","status":"active","release_date":"2026-01-20","model_type":"image","page_url":"https://fal.run/bria/fibo-edit/erase_by_text","tagline":"Fast, reliable removal of unwanted elements from 
images.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-05-20","last_updated":"2026-06-03"},{"id":"bria/fibo-edit/relight","name":"Fibo Edit [Relight]","created_by":"bria","source":"official","description":"Precise, controllable photo re-lighting with structured text inputs.","status":"active","release_date":"2026-01-20","model_type":"image","page_url":"https://fal.run/bria/fibo-edit/relight","tagline":"Precise, controllable lighting changes using simple, structured text inputs.","capabilities":{"vision":true,"structured_output":true,"json_mode":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-05-20","last_updated":"2026-06-03"},{"id":"bria/fibo-edit/replace_object_by_text","name":"Fibo Edit [Replace Object by Text]","created_by":"bria","source":"official","description":"Replace any object in an image using plain language with fine-grained, precise edits and strong prompt adherence.","status":"active","release_date":"2026-01-20","model_type":"image","page_url":"https://fal.run/bria/fibo-edit/replace_object_by_text","tagline":"Natural, expressive object swapping within images using plain language","capabilities":{"vision":true,"structured_output":true,"json_mode":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-05-20","last_updated":"2026-06-03"},{"id":"bria/fibo-edit/reseason","name":"Fibo Edit [Reseason]","created_by":"bria","source":"official","description":"Transform the season or weather of an image - summer to winter, sunny to rainy - with realistic atmosphere and lighting.","status":"active","release_date":"2026-01-20","model_type":"image","page_url":"https://fal.run/bria/fibo-edit/reseason","tagline":"Transforms the seasonal or weather atmosphere of an 
image.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-05-20","last_updated":"2026-06-03"},{"id":"bria/fibo-edit/restore","name":"Fibo Edit [Restore]","created_by":"bria","source":"official","description":"Photo restoration model that automatically denoises, deblurs, and enhances old or damaged photos - removes imperfections while preserving original character.","status":"active","release_date":"2026-01-20","model_type":"image","page_url":"https://fal.run/bria/fibo-edit/restore","tagline":"Automatically renews and cleans noisy or degraded images.","capabilities":{"vision":true,"structured_output":true,"json_mode":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-05-20","last_updated":"2026-06-03"},{"id":"bria/fibo-edit/restyle","name":"Fibo Edit [Restyle]","created_by":"bria","source":"official","description":"Production-grade style transfer that maps photos to distinct artistic styles using curated, brand-safe presets.","status":"active","release_date":"2026-01-20","model_type":"image","page_url":"https://fal.run/bria/fibo-edit/restyle","tagline":"Transforms images into distinct artistic styles using curated, production-grade style mappings","capabilities":{"vision":true,"structured_output":true,"json_mode":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-05-20","last_updated":"2026-06-03"},{"id":"bria/fibo-edit/rewrite_text","name":"Fibo Edit [Rewrite Text]","created_by":"bria","source":"official","description":"Precisely rewrite text inside images while preserving typography, fonts, and layout.","status":"active","release_date":"2026-01-20","model_type":"image","page_url":"https://fal.run/bria/fibo-edit/rewrite_text","tagline":"Precise, reliable modification of existing text inside 
images.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-05-20","last_updated":"2026-06-03"},{"id":"bria/fibo-edit/sketch_to_colored_image","name":"Fibo Edit [Sketch to Image]","created_by":"bria","source":"official","description":"Convert line drawings and sketches into photorealistic, fully colored images with preserved structure.","status":"active","release_date":"2026-01-20","model_type":"image","page_url":"https://fal.run/bria/fibo-edit/sketch_to_colored_image","tagline":"Converts line drawings and sketches into photorealistic, fully colored images","capabilities":{"vision":true,"structured_output":true,"json_mode":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-05-20","last_updated":"2026-06-03"},{"id":"bria/fibo/generate/structured_prompt","name":"Fibo","created_by":"bria","source":"official","description":"Structured Prompt Generation endpoint for Fibo, Bria's SOTA Open source model.","status":"active","release_date":"2025-10-29","model_type":"other","page_url":"https://fal.run/bria/fibo/generate/structured_prompt","tagline":"Structured Prompt Generation endpoint for Fibo, Bria's SOTA Open source model","capabilities":{"structured_output":true,"json_mode":true},"last_seen_at":"2026-05-20","last_updated":"2026-06-03"},{"id":"bria/fibo/generate","name":"Fibo","created_by":"bria","source":"official","description":"SOTA open-source text-to-image model delivering high-fidelity outputs with accurate typography.","status":"active","release_date":"2025-10-29","model_type":"image","page_url":"https://fal.run/bria/fibo/generate","tagline":"SOTA Open source model trained on licensed data, transforming intent into structured control for precise, high-quality AI image generation in enterprise and agentic 
workflows.","capabilities":{"vision":true,"structured_output":true,"json_mode":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-05-20","last_updated":"2026-06-03"},{"id":"bria/fibo-lite/generate/structured_prompt/lite","name":"Fibo Lite","created_by":"bria","source":"official","description":"Structured Prompt Generation endpoint for Fibo-Lite, Bria's SOTA Open source model","status":"active","release_date":"2026-01-19","model_type":"other","page_url":"https://fal.run/bria/fibo-lite/generate/structured_prompt/lite","tagline":"Structured Prompt Generation endpoint for Fibo-Lite, Bria's SOTA Open source model","capabilities":{"structured_output":true,"json_mode":true},"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"bria/fibo-lite/generate/structured_prompt","name":"Fibo Lite","created_by":"bria","source":"official","description":"Convert plain text into Fibo-Lite's transparent JSON-structured prompts - Bria's unique controllability layer that no closed model offers.","status":"active","release_date":"2026-01-19","model_type":"other","page_url":"https://fal.run/bria/fibo-lite/generate/structured_prompt","tagline":"Structured Prompt Generation endpoint for Fibo-Lite, Bria's SOTA Open source model","capabilities":{"structured_output":true,"json_mode":true},"last_seen_at":"2026-05-20","last_updated":"2026-06-03"},{"id":"bria/fibo-lite/generate","name":"Fibo Lite","created_by":"bria","source":"official","description":"Fast, low-latency text-to-image model with high-quality output and full JSON-structured controllability.","status":"active","release_date":"2025-12-16","model_type":"image","page_url":"https://fal.run/bria/fibo-lite/generate","tagline":"Fibo Lite, the new addition to the Fibo model family, allows generating high-quality images with the same controllability of the JSON structured prompt with significantly improved 
latency.","capabilities":{"vision":true,"structured_output":true,"json_mode":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-05-20","last_updated":"2026-06-03"},{"id":"bria/genfill/v2","name":"Genfill","created_by":"bria","source":"official","description":"The GenFill Route enables the generation of objects by prompt in a specific region of an image.","status":"active","release_date":"2026-06-08","model_type":"image","page_url":"https://fal.run/bria/genfill/v2","tagline":"The GenFill Route enables the generation of objects by prompt in a specific region of an image.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-10","last_updated":"2026-06-18"},{"id":"bria/reimagine/3.2","name":"Reimagine","created_by":"bria","source":"official","description":"Reimagine uses a structure reference for generating new images while preserving the structure of an input image, guided by text prompts.","status":"active","release_date":"2025-08-20","model_type":"image","page_url":"https://fal.run/bria/reimagine/3.2","tagline":"Reimagine uses a structure reference for generating new images while preserving the structure of an input image, guided by text prompts.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"bria/replace-background","name":"Replace Background","created_by":"bria","source":"official","description":"Generate professional, eCommerce-ready product shots by replacing backgrounds with realistic lighting and accurate perspective from a simple text prompt.","status":"active","release_date":"2026-01-27","model_type":"image","page_url":"https://fal.run/bria/replace-background","tagline":"Creates enriched product shots by placing them in various environments using textual 
descriptions.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-05-20","last_updated":"2026-06-03"},{"id":"bria/text-to-image/3.2","name":"Bria 3.2 Text-to-Image","created_by":"bria","source":"official","description":"Bria’s Text-to-Image model, trained exclusively on licensed data for safe and risk-free commercial use.","status":"active","release_date":"2025-06-17","model_type":"image","page_url":"https://fal.run/bria/text-to-image/3.2","tagline":"Bria’s Text-to-Image model, trained exclusively on licensed data for safe and risk-free commercial use.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"bria/upscale/creative","name":"Upscale","created_by":"bria","source":"official","description":"Professional-grade creative upscaler that doubles resolution up to 10MP, regenerating sharper textures, refined details, and cleaner faces.","status":"active","release_date":"2026-02-23","model_type":"image","page_url":"https://fal.run/bria/upscale/creative","tagline":"Regenerate the image with sharper textures and richer details while doubling resolution, up to 10 megapixels output.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-05-20","last_updated":"2026-06-03"},{"id":"bria/video/background-removal/realtime","name":"Bria's VRMBG 3.0 Realtime","created_by":"bria","source":"official","description":"Remove video backgrounds in real time with Bria’s VRMBG 3.0 model.","status":"active","release_date":"2026-06-09","model_type":"other","page_url":"https://fal.run/bria/video/background-removal/realtime","tagline":"Remove video backgrounds in real time with Bria’s VRMBG 3.0 model.","last_seen_at":"2026-06-14","last_updated":"2026-06-18"},{"id":"bria/video/background-removal/v3","name":"Bria's 
VRMBG 3.0","created_by":"bria","source":"official","description":"Remove backgrounds from any video with Bria's VRMBG 3.0.","status":"active","release_date":"2026-06-08","model_type":"other","page_url":"https://fal.run/bria/video/background-removal/v3","tagline":"Remove backgrounds from any video with Bria's VRMBG 3.0.","last_seen_at":"2026-06-14","last_updated":"2026-06-18"},{"id":"bria/video/background-removal","name":"Video","created_by":"bria","source":"official","description":"Automatically remove backgrounds from videos -perfect for creating clean, professional content without a green screen.","status":"active","release_date":"2025-06-30","model_type":"other","page_url":"https://fal.run/bria/video/background-removal","tagline":"Automatically remove backgrounds from videos -perfect for creating clean, professional content without a green screen.","last_seen_at":"2026-06-14","last_updated":"2026-06-18"},{"id":"bria/video/erase/keypoints","name":"Video","created_by":"bria","source":"official","description":"High-fidelity keypoint-driven video object removal - minimal input, strong temporal consistency.","status":"active","release_date":"2025-12-23","model_type":"other","page_url":"https://fal.run/bria/video/erase/keypoints","tagline":"A high-fidelity capability for erasing unwanted objects, people, or visual elements from videos while maintaining aesthetic quality and temporal consistency.","last_seen_at":"2026-05-20","last_updated":"2026-06-03"},{"id":"bria/video/erase/mask","name":"Video","created_by":"bria","source":"official","description":"High-fidelity mask-based video object removal with strong temporal consistency.","status":"active","release_date":"2025-12-23","model_type":"other","page_url":"https://fal.run/bria/video/erase/mask","tagline":"A high-fidelity capability for erasing unwanted objects, people, or visual elements from videos while maintaining aesthetic quality and temporal 
consistency.","last_seen_at":"2026-05-20","last_updated":"2026-06-03"},{"id":"bria/video/erase/prompt","name":"Video","created_by":"bria","source":"official","description":"Erase unwanted objects, people, or elements from video with a text prompt.","status":"active","release_date":"2025-12-23","model_type":"other","page_url":"https://fal.run/bria/video/erase/prompt","tagline":"A high-fidelity capability for erasing unwanted objects, people, or visual elements from videos while maintaining aesthetic quality and temporal consistency","last_seen_at":"2026-05-20","last_updated":"2026-06-03"},{"id":"bria/video/increase-resolution","name":"Video","created_by":"bria","source":"official","description":"Professional-grade video upscaler with strong temporal consistency, enhancing videos up to 8K resolution.","status":"active","release_date":"2025-08-26","model_type":"other","page_url":"https://fal.run/bria/video/increase-resolution","tagline":"Upscale videos up to 8K output resolution.","last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"bytedance/lynx","name":"Lynx","created_by":"bytedance","source":"official","description":"Generate subject consistent videos using Lynx from ByteDance!","status":"active","release_date":"2025-11-18","model_type":"video","page_url":"https://fal.run/bytedance/lynx","tagline":"Generate subject consistent videos using Lynx from ByteDance!","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"bytedance/seed-audio-1.0","name":"Seed Audio 1.0","created_by":"bytedance","source":"official","description":"Seed Audio 1.0 is a new audio model from Bytedance that can generate high-quality, natural sounding audio using text, reference audios or an image.","status":"active","release_date":"2026-06-25","model_type":"other","page_url":"https://fal.run/bytedance/seed-audio-1.0","tagline":"Seed Audio 1.0 is a new audio model 
from Bytedance that can generate high-quality, natural sounding audio using text, reference audios or an image.","capabilities":{"vision":true},"last_seen_at":"2026-06-26","last_updated":"2026-06-29"},{"id":"bytedance/seedance-2.0/fast/image-to-video","name":"Seedance 2.0 Fast Image to Video","created_by":"bytedance","source":"official","description":"ByteDance's most advanced image-to-video model, fast tier.","status":"active","release_date":"2026-04-01","model_type":"video","page_url":"https://fal.run/bytedance/seedance-2.0/fast/image-to-video","tagline":"ByteDance's most advanced image-to-video model, fast tier.","capabilities":{"vision":true},"modalities":{"input":["text","image","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-22","last_updated":"2026-05-11"},{"id":"bytedance/seedance-2.0/fast/reference-to-video","name":"Seedance 2.0 Fast Reference to Video","created_by":"bytedance","source":"official","description":"ByteDance's most advanced reference-to-video model, fast tier.","status":"active","release_date":"2026-04-01","model_type":"video","page_url":"https://fal.run/bytedance/seedance-2.0/fast/reference-to-video","tagline":"ByteDance's most advanced reference-to-video model, fast tier.","capabilities":{"vision":true},"modalities":{"input":["text","image","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-05-29","last_updated":"2026-06-03"},{"id":"bytedance/seedance-2.0/fast/text-to-video","name":"Seedance 2.0 Fast Text to Video","created_by":"bytedance","source":"official","description":"ByteDance's most advanced text-to-video model, fast tier.","status":"active","release_date":"2026-04-01","model_type":"video","page_url":"https://fal.run/bytedance/seedance-2.0/fast/text-to-video","tagline":"ByteDance's most advanced text-to-video model, fast 
tier.","modalities":{"input":["text","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-05-29","last_updated":"2026-06-03"},{"id":"bytedance/seedance-2.0/image-to-video","name":"Seedance 2 Image to Video","created_by":"bytedance","source":"official","description":"ByteDance's most advanced image-to-video model.","status":"active","release_date":"2026-04-01","model_type":"video","page_url":"https://fal.run/bytedance/seedance-2.0/image-to-video","tagline":"ByteDance's most advanced image-to-video model.","capabilities":{"vision":true},"modalities":{"input":["text","image","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"bytedance/seedance-2.0/mini/image-to-video","name":"Seedance 2.0 Mini Image to Video","created_by":"bytedance","source":"official","description":"Seedance 2.0 Mini is a faster version of Seedance 2.0 that brings great performance and high generation speed at a lower cost.","status":"active","release_date":"2026-06-23","model_type":"video","page_url":"https://fal.run/bytedance/seedance-2.0/mini/image-to-video","tagline":"Seedance 2.0 Mini is a faster version of Seedance 2.0 that brings great performance and high generation speed at a lower cost.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"bytedance/seedance-2.0/mini/reference-to-video","name":"Seedance 2.0 Mini","created_by":"bytedance","source":"official","description":"Seedance 2.0 Mini is a faster version of Seedance 2.0 that brings great performance and high generation speed at a lower cost.","status":"active","release_date":"2026-06-23","model_type":"video","page_url":"https://fal.run/bytedance/seedance-2.0/mini/reference-to-video","tagline":"Seedance 2.0 Mini is a faster version of Seedance 2.0 that brings great performance and high generation speed at a lower 
cost.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"bytedance/seedance-2.0/mini/text-to-video","name":"Seedance 2.0 Mini Text to Video","created_by":"bytedance","source":"official","description":"Seedance 2.0 Mini is a faster version of Seedance 2.0 that brings great performance and high generation speed at a lower cost.","status":"active","release_date":"2026-06-23","model_type":"video","page_url":"https://fal.run/bytedance/seedance-2.0/mini/text-to-video","tagline":"Seedance 2.0 Mini is a faster version of Seedance 2.0 that brings great performance and high generation speed at a lower cost.","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"bytedance/seedance-2.0/reference-to-video","name":"Seedance 2 Reference to Video","created_by":"bytedance","source":"official","description":"ByteDance's most advanced reference-to-video model.","status":"active","release_date":"2026-04-01","model_type":"video","page_url":"https://fal.run/bytedance/seedance-2.0/reference-to-video","tagline":"ByteDance's most advanced reference-to-video model.","capabilities":{"vision":true},"modalities":{"input":["text","image","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"bytedance/seedance-2.0/text-to-video","name":"Seedance 2.0 Text to Video API","created_by":"bytedance","source":"official","description":"ByteDance's most advanced text-to-video model.","status":"active","release_date":"2026-04-01","model_type":"video","page_url":"https://fal.run/bytedance/seedance-2.0/text-to-video","tagline":"ByteDance's most advanced text-to-video 
model.","modalities":{"input":["text","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-23","last_updated":"2026-06-29"},{"id":"cassetteai/music-generator","name":"music generator","created_by":"cassetteai","source":"official","description":"CassetteAI’s model generates a 30-second sample in under 2 seconds and a full 3-minute track in under 10 seconds.","status":"active","release_date":"2025-03-27","model_type":"other","page_url":"https://fal.run/CassetteAI/music-generator","tagline":"CassetteAI’s model generates a 30-second sample in under 2 seconds and a full 3-minute track in under 10 seconds.","last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"cassetteai/sound-effects-generator","name":"Sound Effects Generator","created_by":"cassetteai","source":"official","description":"Create stunningly realistic sound effects in seconds - CassetteAI's Sound Effects Model generates high-quality SFX up to 30 seconds long in just 1 second of processing time","status":"active","release_date":"2025-04-03","model_type":"other","page_url":"https://fal.run/cassetteai/sound-effects-generator","tagline":"Create stunningly realistic sound effects in seconds - CassetteAI's Sound Effects Model generates high-quality SFX up to 30 seconds long in just 1 second of processing time","last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"cassetteai/video-sound-effects-generator","name":"Video Sound Effects Generator","created_by":"cassetteai","source":"official","description":"Add sound effects to your videos","status":"active","release_date":"2025-04-07","model_type":"other","page_url":"https://fal.run/cassetteai/video-sound-effects-generator","tagline":"Add sound effects to your videos","last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"clarityai/crystal-upscaler","name":"Crystal Upscaler","created_by":"clarityai","source":"official","description":"An advanced image enhancement tool designed specifically for facial details and 
portrait photography, utilizing Clarity AI's upscaling technology.","status":"active","release_date":"2025-11-25","model_type":"image","page_url":"https://fal.run/clarityai/crystal-upscaler","tagline":"An advanced image enhancement tool designed specifically for facial details and portrait photography, utilizing Clarity AI's upscaling technology.","capabilities":{"vision":true,"tool_call":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"tools":["function_calling"],"last_seen_at":"2026-05-06","last_updated":"2026-05-11"},{"id":"clarityai/crystal-video-upscaler","name":"Crystal Upscaler [Video]","created_by":"clarityai","source":"official","description":"Do high precision video upscaling that respects the original video perfectly using Crystal Upscaler's new video upscaling method!","status":"active","release_date":"2025-12-17","model_type":"other","page_url":"https://fal.run/clarityai/crystal-video-upscaler","tagline":"Do high precision video upscaling that respects the original video perfectly using Crystal Upscaler's new video upscaling method!","last_seen_at":"2026-05-06","last_updated":"2026-05-11"},{"id":"decart/lucy-edit/pro","name":"Lucy Edit [Pro]","created_by":"decart","source":"official","description":"Edit outfits, objects, faces, or restyle your video - all with maximum detail retention.","status":"active","release_date":"2025-09-18","model_type":"other","page_url":"https://fal.run/decart/lucy-edit/pro","tagline":"Edit outfits, objects, faces, or restyle your video - all with maximum detail retention.","last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"decart/lucy-restyle","name":"Lucy Restyle","created_by":"decart","source":"official","description":"Restyle videos up to 30 min long - maintaining maximum detail quality.","status":"active","release_date":"2025-12-18","model_type":"other","page_url":"https://fal.run/decart/lucy-restyle","tagline":"Restyle videos up to 30 min long - maintaining maximum 
detail quality.","last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"decart/lucy2-vton/realtime","name":"Lucy 2.1 VTON Realtime","created_by":"decart","source":"official","description":"Realtime Try On experience with Decart Lucy 2.1 VTON","status":"active","release_date":"2026-04-29","model_type":"other","page_url":"https://fal.run/decart/lucy2-vton/realtime","tagline":"Realtime Try On experience with Decart Lucy 2.1 VTON","last_seen_at":"2026-05-07","last_updated":"2026-05-11"},{"id":"fal-ai/ace-step/audio-inpaint","name":"ACE Step Audio Inpaint","created_by":"fal","source":"official","description":"Modify a portion of provided audio with lyrics and/or style using ACE-Step","status":"active","release_date":"2025-05-11","model_type":"other","page_url":"https://fal.run/fal-ai/ace-step/audio-inpaint","tagline":"Modify a portion of provided audio with lyrics and/or style using ACE-Step","last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/ace-step/audio-outpaint","name":"ACE Step Audio Outpaint","created_by":"fal","source":"official","description":"Extend the beginning or end of provided audio with lyrics and/or style using ACE-Step","status":"active","release_date":"2025-05-11","model_type":"other","page_url":"https://fal.run/fal-ai/ace-step/audio-outpaint","tagline":"Extend the beginning or end of provided audio with lyrics and/or style using ACE-Step","last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/ace-step/audio-to-audio","name":"ACE Step Audio To Audio","created_by":"fal","source":"official","description":"Generate music from a lyrics and example audio using ACE-Step","status":"active","release_date":"2025-05-11","model_type":"other","page_url":"https://fal.run/fal-ai/ace-step/audio-to-audio","tagline":"Generate music from a lyrics and example audio using ACE-Step","last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/ace-step/prompt-to-audio","name":"ACE Step Prompt To 
Audio","created_by":"fal","source":"official","description":"Generate music from a simple prompt using ACE-Step","status":"active","release_date":"2025-05-11","model_type":"other","page_url":"https://fal.run/fal-ai/ace-step/prompt-to-audio","tagline":"Generate music from a simple prompt using ACE-Step","last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/ace-step","name":"ACE Step","created_by":"fal","source":"official","description":"Generate music with lyrics from text using ACE-Step","status":"active","release_date":"2025-05-08","model_type":"other","page_url":"https://fal.run/fal-ai/ace-step","tagline":"Generate music with lyrics from text using ACE-Step","last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/ai-avatar/multi-text","name":"AI Avatar Multi Text","created_by":"fal","source":"official","description":"MultiTalk model generates a multi-person conversation video from an image and text inputs.","status":"active","release_date":"2025-06-23","model_type":"video","page_url":"https://fal.run/fal-ai/ai-avatar/multi-text","tagline":"MultiTalk model generates a multi-person conversation video from an image and text inputs.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/ai-avatar/multi","name":"AI Avatar Multi","created_by":"fal","source":"official","description":"MultiTalk model generates a multi-person conversation video from an image and audio files.","status":"active","release_date":"2025-06-23","model_type":"video","page_url":"https://fal.run/fal-ai/ai-avatar/multi","tagline":"MultiTalk model generates a multi-person conversation video from an image and audio files.","capabilities":{"vision":true},"modalities":{"input":["text","image","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/ai-avatar/single-text","name":"AI 
Avatar Single Text","created_by":"fal","source":"official","description":"MultiTalk model generates a talking avatar video from an image and text.","status":"active","release_date":"2025-06-23","model_type":"video","page_url":"https://fal.run/fal-ai/ai-avatar/single-text","tagline":"MultiTalk model generates a talking avatar video from an image and text.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/ai-avatar","name":"Ai Avatar","created_by":"fal","source":"official","description":"MultiTalk model generates a talking avatar video from an image and audio file.","status":"active","release_date":"2025-06-23","model_type":"video","page_url":"https://fal.run/fal-ai/ai-avatar","tagline":"MultiTalk model generates a talking avatar video from an image and audio file.","capabilities":{"vision":true},"modalities":{"input":["text","image","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/amt-interpolation/frame-interpolation","name":"AMT Frame Interpolation","created_by":"fal","source":"official","description":"Interpolate between image frames","status":"active","release_date":"2024-07-18","model_type":"video","page_url":"https://fal.run/fal-ai/amt-interpolation/frame-interpolation","tagline":"Interpolate between image frames","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/amt-interpolation","name":"AMT Interpolation","created_by":"fal","source":"official","description":"Interpolate between video frames","status":"active","release_date":"2024-02-21","model_type":"other","page_url":"https://fal.run/fal-ai/amt-interpolation","tagline":"Interpolate between video 
frames","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/animatediff-sparsectrl-lcm","name":"Animatediff SparseCtrl LCM","created_by":"fal","source":"official","description":"Animate Your Drawings with Latent Consistency Models!","status":"active","release_date":"2023-11-09","model_type":"video","page_url":"https://fal.run/fal-ai/animatediff-sparsectrl-lcm","tagline":"Animate Your Drawings with Latent Consistency Models!","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/arbiter/image/image","name":"Arbiter","created_by":"fal","source":"official","description":"Image reference comparison measurements","status":"active","release_date":"2025-12-26","model_type":"other","page_url":"https://fal.run/fal-ai/arbiter/image/image","tagline":"Image reference comparison measurements","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/arbiter/image/text","name":"Arbiter","created_by":"fal","source":"official","description":"Semantic image alignment measurements","status":"active","release_date":"2025-12-26","model_type":"other","page_url":"https://fal.run/fal-ai/arbiter/image/text","tagline":"Semantic image alignment measurements","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/arbiter/image","name":"Arbiter","created_by":"fal","source":"official","description":"Reference-free image measurements","status":"active","release_date":"2025-12-26","model_type":"other","page_url":"https://fal.run/fal-ai/arbiter/image","tagline":"Reference-free image measurements","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/audio-understanding","name":"Audio Understanding","created_by":"fal","source":"official","description":"A audio understanding model to analyze audio content and answer questions about what's happening in the 
audio based on user prompts.","status":"active","release_date":"2025-10-24","model_type":"other","page_url":"https://fal.run/fal-ai/audio-understanding","tagline":"A audio understanding model to analyze audio content and answer questions about what's happening in the audio based on user prompts.","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/aura-flow","name":"AuraFlow","created_by":"fal","source":"official","description":"AuraFlow v0.3 is an open-source flow-based text-to-image generation model that achieves state-of-the-art results on GenEval.","status":"active","release_date":"2024-12-02","model_type":"image","page_url":"https://fal.run/fal-ai/aura-flow","tagline":"AuraFlow v0.3 is an open-source flow-based text-to-image generation model that achieves state-of-the-art results on GenEval.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-05-05","last_updated":"2026-05-11"},{"id":"fal-ai/aura-sr","name":"AuraSR","created_by":"fal","source":"official","description":"Upscale your images with AuraSR.","status":"active","release_date":"2024-04-11","model_type":"image","page_url":"https://fal.run/fal-ai/aura-sr","tagline":"Upscale your images with AuraSR.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-05-05","last_updated":"2026-05-11"},{"id":"fal-ai/auto-caption","name":"Auto-Captioner","created_by":"fal","source":"official","description":"Automatically generates text captions for your videos from the audio as per text colour/font specifications","status":"active","release_date":"2025-01-03","model_type":"other","page_url":"https://fal.run/fal-ai/auto-caption","tagline":"Automatically generates text captions for your videos from the audio as per text colour/font 
specifications","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/bagel/edit","name":"Bagel","created_by":"fal","source":"official","description":"Bagel is a 7B parameter multimodal model from Bytedance-Seed that can generate both images and text.","status":"active","release_date":"2025-05-21","model_type":"image","page_url":"https://fal.run/fal-ai/bagel/edit","tagline":"Bagel is a 7B parameter multimodal model from Bytedance-Seed that can generate both images and text.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/bagel/understand","name":"Bagel","created_by":"fal","source":"official","description":"Bagel is a 7B parameter multimodal model from Bytedance-Seed that can generate both text and images.","status":"active","release_date":"2025-05-21","model_type":"other","page_url":"https://fal.run/fal-ai/bagel/understand","tagline":"Bagel is a 7B parameter multimodal model from Bytedance-Seed that can generate both text and images.","capabilities":{"vision":true,"structured_output":true,"json_mode":true},"last_seen_at":"2026-04-27","last_updated":"2026-05-11"},{"id":"fal-ai/bagel","name":"Bagel","created_by":"fal","source":"official","description":"Bagel is a 7B parameter from Bytedance-Seed multimodal model that can generate both text and images.","status":"active","release_date":"2025-05-21","model_type":"image","page_url":"https://fal.run/fal-ai/bagel","tagline":"Bagel is a 7B parameter from Bytedance-Seed multimodal model that can generate both text and images.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/ben/v2/image","name":"ben-v2-image","created_by":"fal","source":"official","description":"A fast and high quality model for image background 
removal.","status":"active","release_date":"2025-02-11","model_type":"image","page_url":"https://fal.run/fal-ai/ben/v2/image","tagline":"A fast and high quality model for image background removal.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/ben/v2/video","name":"Ben-Video-Bg-Rm","created_by":"fal","source":"official","description":"A model for high quality and smooth background removal for videos.","status":"active","release_date":"2025-02-11","model_type":"other","page_url":"https://fal.run/fal-ai/ben/v2/video","tagline":"A model for high quality and smooth background removal for videos.","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/bernini-r/edit-image","name":"Bernini-R Edit Image","created_by":"fal","source":"official","description":"Edit any image with a natural-language instruction using Bernini-R, changing the weather, materials, objects, or style while preserving the original composition.","status":"active","release_date":"2026-06-08","model_type":"image","page_url":"https://fal.run/fal-ai/bernini-r/edit-image","tagline":"Edit any image with a natural-language instruction using Bernini-R, changing the weather, materials, objects, or style while preserving the original composition.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-09","last_updated":"2026-06-10"},{"id":"fal-ai/bernini-r/edit-video","name":"Bernini-R Edit Video","created_by":"fal","source":"official","description":"Edit any video with a natural-language instruction using Bernini-R, changing objects, weather, background, or camera angle while keeping the rest of the scene intact.","status":"active","release_date":"2026-06-08","model_type":"other","page_url":"https://fal.run/fal-ai/bernini-r/edit-video","tagline":"Edit any video with a 
natural-language instruction using Bernini-R, changing objects, weather, background, or camera angle while keeping the rest of the scene intact.","last_seen_at":"2026-06-09","last_updated":"2026-06-10"},{"id":"fal-ai/bernini-r/reference-edit-video","name":"Bernini-R Reference Edit Video","created_by":"fal","source":"official","description":"Edit a video guided by reference images with Bernini-R, bringing an object, material, background, style, or weather from a reference image into your video.","status":"active","release_date":"2026-06-08","model_type":"other","page_url":"https://fal.run/fal-ai/bernini-r/reference-edit-video","tagline":"Edit a video guided by reference images with Bernini-R, bringing an object, material, background, style, or weather from a reference image into your video.","capabilities":{"vision":true},"last_seen_at":"2026-06-09","last_updated":"2026-06-10"},{"id":"fal-ai/bernini-r/reference-to-video","name":"Bernini-R Reference to Video","created_by":"fal","source":"official","description":"Turn up to five reference images into one continuous, consistent video with Bernini-R, with smooth, stable camera motion and no scene cuts.","status":"active","release_date":"2026-06-08","model_type":"video","page_url":"https://fal.run/fal-ai/bernini-r/reference-to-video","tagline":"Turn up to five reference images into one continuous, consistent video with Bernini-R, with smooth, stable camera motion and no scene cuts.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-09","last_updated":"2026-06-10"},{"id":"fal-ai/bernini-r/text-to-video","name":"Bernini-R Text to Video","created_by":"fal","source":"official","description":"Generate high-quality video from a text prompt with Bernini-R, ByteDance's unified video generation and editing 
model.","status":"active","release_date":"2026-06-08","model_type":"video","page_url":"https://fal.run/fal-ai/bernini-r/text-to-video","tagline":"Generate high-quality video from a text prompt with Bernini-R, ByteDance's unified video generation and editing model.","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-09","last_updated":"2026-06-10"},{"id":"fal-ai/birefnet/v2/video","name":"Birefnet","created_by":"fal","source":"official","description":"Video background removal version of bilateral reference framework (BiRefNet) for high-resolution dichotomous image segmentation (DIS)\n","status":"active","release_date":"2025-10-26","model_type":"other","page_url":"https://fal.run/fal-ai/birefnet/v2/video","tagline":"Video background removal version of bilateral reference framework (BiRefNet) for high-resolution dichotomous image segmentation (DIS)\n","capabilities":{"vision":true},"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/birefnet/v2","name":"Birefnet Background Removal V2","created_by":"fal","source":"official","description":"bilateral reference framework (BiRefNet) for high-resolution dichotomous image segmentation (DIS)","status":"active","release_date":"2024-10-28","model_type":"image","page_url":"https://fal.run/fal-ai/birefnet/v2","tagline":"bilateral reference framework (BiRefNet) for high-resolution dichotomous image segmentation (DIS)","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-05-13","last_updated":"2026-06-03"},{"id":"fal-ai/birefnet","name":"Birefnet Background Removal","created_by":"fal","source":"official","description":"bilateral reference framework (BiRefNet) for high-resolution dichotomous image segmentation (DIS)","status":"active","release_date":"2024-02-27","model_type":"image","page_url":"https://fal.run/fal-ai/birefnet","tagline":"bilateral reference framework (BiRefNet) for 
high-resolution dichotomous image segmentation (DIS)","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-05-13","last_updated":"2026-06-03"},{"id":"fal-ai/bitdance","name":"Bitdance","created_by":"fal","source":"official","description":"Image generation with BitDance.","status":"active","release_date":"2026-02-21","model_type":"image","page_url":"https://fal.run/fal-ai/bitdance","tagline":"Image generation with BitDance.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-02-21","last_updated":"2026-05-11"},{"id":"fal-ai/boogu-image/edit","name":"Boogu Image","created_by":"fal","source":"official","description":"Image To Image Model using Boogu-Image","status":"active","release_date":"2026-06-18","model_type":"image","page_url":"https://fal.run/fal-ai/boogu-image/edit","tagline":"Image To Image Model using Boogu-Image","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-18","last_updated":"2026-06-18"},{"id":"fal-ai/boogu-image","name":"Boogu Image","created_by":"fal","source":"official","description":"Text To Image Model using Boogu-Image","status":"active","release_date":"2026-06-18","model_type":"image","page_url":"https://fal.run/fal-ai/boogu-image","tagline":"Text To Image Model using Boogu-Image","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-18","last_updated":"2026-06-18"},{"id":"fal-ai/bria/background/remove","name":"Bria RMBG 2.0","created_by":"fal","source":"official","description":"Bria RMBG 2.0 enables seamless removal of backgrounds from images, ideal for professional editing tasks.","status":"active","release_date":"2024-12-19","model_type":"image","page_url":"https://fal.run/fal-ai/bria/background/remove","tagline":"Bria RMBG 2.0 
enables seamless removal of backgrounds from images, ideal for professional editing tasks.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/bria/background/replace","name":"Bria Background Replace","created_by":"fal","source":"official","description":"Bria Background Replace allows for efficient swapping of backgrounds in images via text prompts or reference image, delivering realistic and polished results.","status":"active","release_date":"2024-12-19","model_type":"image","page_url":"https://fal.run/fal-ai/bria/background/replace","tagline":"Bria Background Replace allows for efficient swapping of backgrounds in images via text prompts or reference image, delivering realistic and polished results.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/bria/eraser","name":"Bria Eraser","created_by":"fal","source":"official","description":"Bria Eraser enables precise removal of unwanted objects from images while maintaining high-quality outputs.","status":"active","release_date":"2024-12-19","model_type":"image","page_url":"https://fal.run/fal-ai/bria/eraser","tagline":"Bria Eraser enables precise removal of unwanted objects from images while maintaining high-quality outputs.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/bria/expand","name":"Bria Expand Image","created_by":"fal","source":"official","description":"Bria Expand expands images beyond their borders in high quality.","status":"active","release_date":"2024-12-19","model_type":"image","page_url":"https://fal.run/fal-ai/bria/expand","tagline":"Bria Expand expands images beyond their borders in high 
quality.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/bria/genfill","name":"Bria GenFill","created_by":"fal","source":"official","description":"Bria GenFill enables high-quality object addition or visual transformation.","status":"active","release_date":"2024-12-19","model_type":"image","page_url":"https://fal.run/fal-ai/bria/genfill","tagline":"Bria GenFill enables high-quality object addition or visual transformation.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/bria/product-shot","name":"Bria Product Shot","created_by":"fal","source":"official","description":"Place any product in any scenery with just a prompt or reference image while maintaining high integrity of the product.","status":"active","release_date":"2024-12-19","model_type":"image","page_url":"https://fal.run/fal-ai/bria/product-shot","tagline":"Place any product in any scenery with just a prompt or reference image while maintaining high integrity of the product.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/bria/reimagine","name":"Bria","created_by":"fal","source":"official","description":"Structure Reference allows generating new images while preserving the structure of an input image, guided by text prompts.","status":"active","release_date":"2025-07-08","model_type":"image","page_url":"https://fal.run/fal-ai/bria/reimagine","tagline":"Structure Reference allows generating new images while preserving the structure of an input image, guided by text 
prompts.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/bria/text-to-image/base","name":"Bria Text-to-Image Base","created_by":"fal","source":"official","description":"Bria's Text-to-Image model, trained exclusively on licensed data for safe and risk-free commercial use.","status":"active","release_date":"2024-12-19","model_type":"image","page_url":"https://fal.run/fal-ai/bria/text-to-image/base","tagline":"Bria's Text-to-Image model, trained exclusively on licensed data for safe and risk-free commercial use.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/bria/text-to-image/fast","name":"Bria Text-to-Image Fast","created_by":"fal","source":"official","description":"Bria's Text-to-Image model with perfect harmony of latency and quality.","status":"active","release_date":"2024-12-19","model_type":"image","page_url":"https://fal.run/fal-ai/bria/text-to-image/fast","tagline":"Bria's Text-to-Image model with perfect harmony of latency and quality.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/bria/text-to-image/hd","name":"Bria Text-to-Image HD","created_by":"fal","source":"official","description":"Bria's Text-to-Image model for HD images.","status":"active","release_date":"2024-12-19","model_type":"image","page_url":"https://fal.run/fal-ai/bria/text-to-image/hd","tagline":"Bria's Text-to-Image model for HD images.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/bytedance/dreamactor/v2","name":"Bytedance Dreamactor 
V2","created_by":"fal","source":"official","description":"Transfer motion from a video to characters in an image using Dreamactor v2.","status":"active","release_date":"2026-02-06","model_type":"other","page_url":"https://fal.run/fal-ai/bytedance/dreamactor/v2","tagline":"Transfer motion from a video to characters in an image using Dreamactor v2.","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/bytedance/dreamina/v3.1/text-to-image","name":"Bytedance Dreamina V3.1 Text To Image","created_by":"fal","source":"official","description":"Dreamina showcases superior picture effects, with significant improvements in picture aesthetics, precise and diverse styles, and rich details.","status":"active","release_date":"2025-08-06","model_type":"image","page_url":"https://fal.run/fal-ai/bytedance/dreamina/v3.1/text-to-image","tagline":"Dreamina showcases superior picture effects, with significant improvements in picture aesthetics, precise and diverse styles, and rich details.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/bytedance/omnihuman/v1.5","name":"Bytedance Omnihuman V1.5","created_by":"fal","source":"official","description":"Omnihuman v1.5 is a new and improved version of Omnihuman.","status":"active","release_date":"2025-09-23","model_type":"video","page_url":"https://fal.run/fal-ai/bytedance/omnihuman/v1.5","tagline":"Omnihuman v1.5 is a new and improved version of Omnihuman.","capabilities":{"vision":true},"modalities":{"input":["text","image","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/bytedance/omnihuman","name":"OmniHuman","created_by":"fal","source":"official","description":"OmniHuman generates video using an image of a human figure paired with an audio 
file.","status":"active","release_date":"2025-07-27","model_type":"video","page_url":"https://fal.run/fal-ai/bytedance/omnihuman","tagline":"OmniHuman generates video using an image of a human figure paired with an audio file.","capabilities":{"vision":true},"modalities":{"input":["text","image","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/bytedance/seed-speech/tts/v2","name":"Bytedance Seed Speech Text to Speech","created_by":"fal","source":"official","description":"Seed Speech developed by ByteDance, is a family of large-scale text-to-speech models capable of synthesizing speech that is virtually indistinguishable from human speech.","status":"active","release_date":"2026-06-05","model_type":"tts","page_url":"https://fal.run/fal-ai/bytedance/seed-speech/tts/v2","tagline":"Seed Speech developed by ByteDance, is a family of large-scale text-to-speech models capable of synthesizing speech that is virtually indistinguishable from human speech.","modalities":{"input":["text"],"output":["audio"]},"endpoints":["audio_speech"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/bytedance/seed/v2/mini","name":"Bytedance Seed V2 Mini","created_by":"fal","source":"official","description":" Seed 2.0 Mini is a high-performance multimodal model optimized for low latency and high concurrency.","status":"active","release_date":"2026-03-17","model_type":"other","page_url":"https://fal.run/fal-ai/bytedance/seed/v2/mini","tagline":" Seed 2.0 Mini is a high-performance multimodal model optimized for low latency and high concurrency.","capabilities":{"vision":true,"reasoning":true},"last_seen_at":"2026-03-18","last_updated":"2026-06-03"},{"id":"fal-ai/bytedance/seedance/v1/lite/image-to-video","name":"Seedance 1.0 Lite","created_by":"fal","source":"official","description":"Seedance 1.0 
Lite","status":"active","release_date":"2025-06-13","model_type":"video","page_url":"https://fal.run/fal-ai/bytedance/seedance/v1/lite/image-to-video","tagline":"Seedance 1.0 Lite","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/bytedance/seedance/v1/lite/reference-to-video","name":"Bytedance","created_by":"fal","source":"official","description":"Seedance lite reference-to-video allows the use of 1 to 4 images as reference to create a high-quality video.","status":"active","release_date":"2025-09-01","model_type":"video","page_url":"https://fal.run/fal-ai/bytedance/seedance/v1/lite/reference-to-video","tagline":"Seedance lite reference-to-video allows the use of 1 to 4 images as reference to create a high-quality video.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/bytedance/seedance/v1/lite/text-to-video","name":"Seedance 1.0 Lite","created_by":"fal","source":"official","description":"Seedance 1.0 Lite","status":"active","release_date":"2025-06-13","model_type":"video","page_url":"https://fal.run/fal-ai/bytedance/seedance/v1/lite/text-to-video","tagline":"Seedance 1.0 Lite","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/bytedance/seedance/v1/pro/fast/image-to-video","name":"Bytedance Seedance V1 Pro Fast Image To Video","created_by":"fal","source":"official","description":"Image to Video endpoint for Seedance 1.0 Pro Fast, a next-generation video model designed to deliver maximum performance at minimal cost","status":"active","release_date":"2025-10-24","model_type":"video","page_url":"https://fal.run/fal-ai/bytedance/seedance/v1/pro/fast/image-to-video","tagline":"Image to Video endpoint for Seedance 
1.0 Pro Fast, a next-generation video model designed to deliver maximum performance at minimal cost","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/bytedance/seedance/v1/pro/fast/text-to-video","name":"Bytedance Seedance V1 Pro Fast Text To Video","created_by":"fal","source":"official","description":"Text to Video endpoint for Seedance 1.0 Pro Fast, a next-generation video model designed to deliver maximum performance at minimal cost","status":"active","release_date":"2025-10-24","model_type":"video","page_url":"https://fal.run/fal-ai/bytedance/seedance/v1/pro/fast/text-to-video","tagline":"Text to Video endpoint for Seedance 1.0 Pro Fast, a next-generation video model designed to deliver maximum performance at minimal cost","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/bytedance/seedance/v1/pro/image-to-video","name":"Seedance 1.0 Pro","created_by":"fal","source":"official","description":"Seedance 1.0 Pro, a high quality video generation model developed by Bytedance.","status":"active","release_date":"2025-06-16","model_type":"video","page_url":"https://fal.run/fal-ai/bytedance/seedance/v1/pro/image-to-video","tagline":"Seedance 1.0 Pro, a high quality video generation model developed by Bytedance.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/bytedance/seedance/v1/pro/text-to-video","name":"Seedance 1.0 Pro","created_by":"fal","source":"official","description":"Seedance 1.0 Pro, a high quality video generation model developed by 
Bytedance.","status":"active","release_date":"2025-06-16","model_type":"video","page_url":"https://fal.run/fal-ai/bytedance/seedance/v1/pro/text-to-video","tagline":"Seedance 1.0 Pro, a high quality video generation model developed by Bytedance.","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/bytedance/seedance/v1.5/pro/image-to-video","name":"Bytedance Seedance V1.5 Pro Image To Video","created_by":"fal","source":"official","description":"Generate videos with audio with Seedance 1.5 (supports start & end frame) ","status":"active","release_date":"2025-12-23","model_type":"video","page_url":"https://fal.run/fal-ai/bytedance/seedance/v1.5/pro/image-to-video","tagline":"Generate videos with audio with Seedance 1.5 (supports start & end frame) ","capabilities":{"vision":true},"modalities":{"input":["text","image","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/bytedance/seedance/v1.5/pro/text-to-video","name":"Bytedance Seedance V1.5 Pro Text To Video","created_by":"fal","source":"official","description":"Generate videos with audio with Seedance 1.5","status":"active","release_date":"2025-12-23","model_type":"video","page_url":"https://fal.run/fal-ai/bytedance/seedance/v1.5/pro/text-to-video","tagline":"Generate videos with audio with Seedance 1.5","modalities":{"input":["text","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/bytedance/seedream/v3/text-to-image","name":"Bytedance","created_by":"fal","source":"official","description":"Seedream 3.0 is a bilingual (Chinese and English) text-to-image model that excels at text-to-image generation.","status":"active","release_date":"2025-06-10","model_type":"image","page_url":"https://fal.run/fal-ai/bytedance/seedream/v3/text-to-image","tagline":"Seedream 3.0 is a bilingual (Chinese 
and English) text-to-image model that excels at text-to-image generation.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/bytedance/seedream/v4/edit","name":"Bytedance Seedream V4 Edit","created_by":"fal","source":"official","description":"A new-generation image creation model ByteDance, Seedream 4.0 integrates image generation and image editing capabilities into a single, unified architecture.","status":"active","release_date":"2025-09-09","model_type":"image","page_url":"https://fal.run/fal-ai/bytedance/seedream/v4/edit","tagline":"A new-generation image creation model ByteDance, Seedream 4.0 integrates image generation and image editing capabilities into a single, unified architecture.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-26","last_updated":"2026-06-03"},{"id":"fal-ai/bytedance/seedream/v4/text-to-image","name":"Bytedance Seedream V4 Text To Image","created_by":"fal","source":"official","description":"A new-generation image creation model ByteDance, Seedream 4.0 integrates image generation and image editing capabilities into a single, unified architecture.","status":"active","release_date":"2025-09-09","model_type":"image","page_url":"https://fal.run/fal-ai/bytedance/seedream/v4/text-to-image","tagline":"A new-generation image creation model ByteDance, Seedream 4.0 integrates image generation and image editing capabilities into a single, unified architecture.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/bytedance/seedream/v4.5/edit","name":"Bytedance Seedream V4.5 Edit","created_by":"fal","source":"official","description":"A new-generation image creation model ByteDance, Seedream 4.5 integrates image 
generation and image editing capabilities into a single, unified architecture.","status":"active","release_date":"2025-12-03","model_type":"image","page_url":"https://fal.run/fal-ai/bytedance/seedream/v4.5/edit","tagline":"A new-generation image creation model ByteDance, Seedream 4.5 integrates image generation and image editing capabilities into a single, unified architecture.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-26","last_updated":"2026-06-03"},{"id":"fal-ai/bytedance/seedream/v4.5/text-to-image","name":"Bytedance Seedream V4.5 Text To Image","created_by":"fal","source":"official","description":"A new-generation image creation model ByteDance, Seedream 4.5 integrates image generation and image editing capabilities into a single, unified architecture.","status":"active","release_date":"2025-12-03","model_type":"image","page_url":"https://fal.run/fal-ai/bytedance/seedream/v4.5/text-to-image","tagline":"A new-generation image creation model ByteDance, Seedream 4.5 integrates image generation and image editing capabilities into a single, unified architecture.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-26","last_updated":"2026-06-03"},{"id":"fal-ai/bytedance/seedream/v5/lite/edit","name":"Bytedance Seedream V5 Lite Edit","created_by":"fal","source":"official","description":"Image editing endpoint for the fast Lite version of Seedream 5.0, supporting high quality intelligent image editing with multiple inputs.","status":"active","release_date":"2026-02-23","model_type":"image","page_url":"https://fal.run/fal-ai/bytedance/seedream/v5/lite/edit","tagline":"Image editing endpoint for the fast Lite version of Seedream 5.0, supporting high quality intelligent image editing with multiple 
inputs.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-05-29","last_updated":"2026-06-03"},{"id":"fal-ai/bytedance/seedream/v5/lite/text-to-image","name":"Bytedance Seedream V5 Lite Text To Image","created_by":"fal","source":"official","description":"Text to Image endpoint for the fast Lite version of Seedream 5.0, supporting high quality intelligent text-to-image generation.","status":"active","release_date":"2026-02-23","model_type":"image","page_url":"https://fal.run/fal-ai/bytedance/seedream/v5/lite/text-to-image","tagline":"Text to Image endpoint for the fast Lite version of Seedream 5.0, supporting high quality intelligent text-to-image generation.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-05-27","last_updated":"2026-06-03"},{"id":"fal-ai/bytedance-upscaler/upscale/video","name":"Bytedance Upscaler Upscale Video","created_by":"fal","source":"official","description":"Upscale videos with Bytedance's video upscaler.","status":"active","release_date":"2025-10-31","model_type":"other","page_url":"https://fal.run/fal-ai/bytedance-upscaler/upscale/video","tagline":"Upscale videos with Bytedance's video upscaler.","last_seen_at":"2026-04-28","last_updated":"2026-06-03"},{"id":"fal-ai/bytedance/video-stylize","name":"Bytedance","created_by":"fal","source":"official","description":"Transform your images into stylized videos using this workflow.","status":"active","release_date":"2025-08-12","model_type":"video","page_url":"https://fal.run/fal-ai/bytedance/video-stylize","tagline":"Transform your images into stylized videos using this 
workflow.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/calligrapher","name":"Calligrapher","created_by":"fal","source":"official","description":"Use the text and font retaining capabilities of calligrapher to modify texts on your books, clothes and many more.","status":"active","release_date":"2025-07-12","model_type":"image","page_url":"https://fal.run/fal-ai/calligrapher","tagline":"Use the text and font retaining capabilities of calligrapher to modify texts on your books, clothes and many more.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/cartoonify","name":"Cartoonify","created_by":"fal","source":"official","description":"Transform images into 3D cartoon artwork using an AI model that applies cartoon stylization while preserving the original image's composition and details.","status":"active","release_date":"2025-04-14","model_type":"image","page_url":"https://fal.run/fal-ai/cartoonify","tagline":"Transform images into 3D cartoon artwork using an AI model that applies cartoon stylization while preserving the original image's composition and details.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/cat-vton","name":"try-on","created_by":"fal","source":"official","description":"Image based high quality Virtual Try-On","status":"active","release_date":"2024-12-17","model_type":"image","page_url":"https://fal.run/fal-ai/cat-vton","tagline":"Image based high quality Virtual 
Try-On","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/ccsr","name":"CCSR Upscaler","created_by":"fal","source":"official","description":"SOTA Image Upscaler","status":"active","release_date":"2024-05-05","model_type":"image","page_url":"https://fal.run/fal-ai/ccsr","tagline":"SOTA Image Upscaler","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/chain-of-zoom","name":"Chain Of Zoom","created_by":"fal","source":"official","description":"Extreme Super-Resolution via Scale Autoregression and Preference Alignment","status":"active","release_date":"2025-06-18","model_type":"image","page_url":"https://fal.run/fal-ai/chain-of-zoom","tagline":"Extreme Super-Resolution via Scale Autoregression and Preference Alignment","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/chatterbox/speech-to-speech","name":"Chatterbox","created_by":"fal","source":"official","description":"Whether you're working on memes, videos, games, or AI agents, Chatterbox brings your content to life.","status":"active","release_date":"2025-06-01","model_type":"other","page_url":"https://fal.run/fal-ai/chatterbox/speech-to-speech","tagline":"Whether you're working on memes, videos, games, or AI agents, Chatterbox brings your content to life.","last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/chatterbox/text-to-speech/multilingual","name":"Chatterbox","created_by":"fal","source":"official","description":"Whether you're working on memes, videos, games, or AI agents, Chatterbox brings your content to 
life.","status":"active","release_date":"2025-09-04","model_type":"tts","page_url":"https://fal.run/fal-ai/chatterbox/text-to-speech/multilingual","tagline":"Whether you're working on memes, videos, games, or AI agents, Chatterbox brings your content to life.","modalities":{"input":["text"],"output":["audio"]},"endpoints":["audio_speech"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/chatterbox/text-to-speech","name":"Chatterbox","created_by":"fal","source":"official","description":"Whether you're working on memes, videos, games, or AI agents, Chatterbox brings your content to life.","status":"active","release_date":"2025-06-01","model_type":"tts","page_url":"https://fal.run/fal-ai/chatterbox/text-to-speech","tagline":"Whether you're working on memes, videos, games, or AI agents, Chatterbox brings your content to life.","modalities":{"input":["text"],"output":["audio"]},"endpoints":["audio_speech"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/chrono-edit-lora-gallery/paintbrush","name":"Chrono Edit Lora Gallery","created_by":"fal","source":"official","description":"You can make edits simply by drawing a quick sketch on the input image.","status":"active","release_date":"2025-11-21","model_type":"image","page_url":"https://fal.run/fal-ai/chrono-edit-lora-gallery/paintbrush","tagline":"You can make edits simply by drawing a quick sketch on the input image.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/chrono-edit-lora-gallery/upscaler","name":"Chrono Edit Lora Gallery","created_by":"fal","source":"official","description":"Upscales and cleans up the image.","status":"active","release_date":"2025-11-21","model_type":"image","page_url":"https://fal.run/fal-ai/chrono-edit-lora-gallery/upscaler","tagline":"Upscales and cleans up the 
image.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/chrono-edit-lora","name":"Chrono Edit Lora","created_by":"fal","source":"official","description":"LoRA endpoint for the Chrono Edit model.","status":"active","release_date":"2025-11-21","model_type":"image","page_url":"https://fal.run/fal-ai/chrono-edit-lora","tagline":"LoRA endpoint for the Chrono Edit model.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/chrono-edit","name":"Chrono Edit","created_by":"fal","source":"official","description":"NVIDIA's Logically Consistent and Physics-Aware Image Editing Model","status":"active","release_date":"2025-10-30","model_type":"image","page_url":"https://fal.run/fal-ai/chrono-edit","tagline":"NVIDIA's Logically Consistent and Physics-Aware Image Editing Model","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/clarity-upscaler","name":"Clarity Upscaler","created_by":"fal","source":"official","description":"Clarity upscaler for upscaling images with high very fidelity.","status":"active","release_date":"2024-02-04","model_type":"image","page_url":"https://fal.run/fal-ai/clarity-upscaler","tagline":"Clarity upscaler for upscaling images with high very fidelity.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-05-06","last_updated":"2026-05-11"},{"id":"fal-ai/codeformer","name":"CodeFormer","created_by":"fal","source":"official","description":"Fix distorted or blurred photos of people with 
CodeFormer.","status":"active","release_date":"2025-01-31","model_type":"image","page_url":"https://fal.run/fal-ai/codeformer","tagline":"Fix distorted or blurred photos of people with CodeFormer.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/cogvideox-5b/image-to-video","name":"CogVideoX-5B","created_by":"fal","source":"official","description":"Generate videos from images and prompts using CogVideoX-5B","status":"active","release_date":"2024-10-17","model_type":"video","page_url":"https://fal.run/fal-ai/cogvideox-5b/image-to-video","tagline":"Generate videos from images and prompts using CogVideoX-5B","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/cogvideox-5b/video-to-video","name":"CogVideoX-5B","created_by":"fal","source":"official","description":"Generate videos from videos and prompts using CogVideoX-5B","status":"active","release_date":"2024-10-17","model_type":"other","page_url":"https://fal.run/fal-ai/cogvideox-5b/video-to-video","tagline":"Generate videos from videos and prompts using CogVideoX-5B","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/cogvideox-5b","name":"CogVideoX-5B","created_by":"fal","source":"official","description":"Generate videos from prompts using CogVideoX-5B","status":"active","release_date":"2025-01-14","model_type":"video","parameters":5,"page_url":"https://fal.run/fal-ai/cogvideox-5b","tagline":"Generate videos from prompts using CogVideoX-5B","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/cogview4","name":"CogView","created_by":"fal","source":"official","description":"Generate high quality images from text prompts using 
CogView4.","status":"active","release_date":"2025-03-04","model_type":"image","page_url":"https://fal.run/fal-ai/cogview4","tagline":"Generate high quality images from text prompts using CogView4.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/cohere-transcribe","name":"Cohere Transcribe","created_by":"fal","source":"official","description":"Cohere Transcribe turns your business audio into accurate text, ready for search, analytics, and automation","status":"active","release_date":"2026-04-22","model_type":"transcription","page_url":"https://fal.run/fal-ai/cohere-transcribe","tagline":"Cohere Transcribe turns your business audio into accurate text, ready for search, analytics, and automation","modalities":{"input":["audio"],"output":["text"]},"endpoints":["audio_transcriptions"],"last_seen_at":"2026-05-12","last_updated":"2026-06-03"},{"id":"fal-ai/control-light","name":"ControlLight","created_by":"fal","source":"official","description":"ControlLight is a LoRA fine-tune of FLUX.2 [klein] 9B that enhances low-light images while preserving scene structure and fine details, with a single alpha parameter that gives continuous control over","status":"active","release_date":"2026-05-27","model_type":"image","page_url":"https://fal.run/fal-ai/control-light","tagline":"ControlLight is a LoRA fine-tune of FLUX.2 [klein] 9B that enhances low-light images while preserving scene structure and fine details, with a single alpha parameter that gives continuous control over","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-05-29","last_updated":"2026-06-03"},{"id":"fal-ai/controlfoley","name":"Controlfoley","created_by":"fal","source":"official","description":"Foley Control is a video-to-audio model that automatically generates synchronized sound effects for videos, 
using text prompts to shape the type of sound while matching the timing and action on screen","status":"active","release_date":"2026-05-05","model_type":"other","page_url":"https://fal.run/fal-ai/controlfoley","tagline":"Foley Control is a video-to-audio model that automatically generates synchronized sound effects for videos, using text prompts to shape the type of sound while matching the timing and action on screen","last_seen_at":"2026-05-22","last_updated":"2026-06-03"},{"id":"fal-ai/controlnext","name":"ControlNeXt SVD","created_by":"fal","source":"official","description":"Animate a reference image with a driving video using ControlNeXt.","status":"active","release_date":"2024-09-05","model_type":"other","page_url":"https://fal.run/fal-ai/controlnext","tagline":"Animate a reference image with a driving video using ControlNeXt.","capabilities":{"vision":true},"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/cosmos-predict-2.5/distilled/text-to-video","name":"Cosmos Predict 2.5 2B Distilled","created_by":"fal","source":"official","description":"Generate video from text and videos using NVIDIA's 2B Cosmos Distilled Model","status":"active","release_date":"2026-02-24","model_type":"video","page_url":"https://fal.run/fal-ai/cosmos-predict-2.5/distilled/text-to-video","tagline":"Generate video from text and videos using NVIDIA's 2B Cosmos Distilled Model","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-28","last_updated":"2026-05-11"},{"id":"fal-ai/cosmos-predict-2.5/image-to-video","name":"Cosmos Predict 2.5 2B","created_by":"fal","source":"official","description":"Generate video from text and images using NVIDIA's 2B Cosmos Post-Trained Model","status":"active","release_date":"2026-02-24","model_type":"video","page_url":"https://fal.run/fal-ai/cosmos-predict-2.5/image-to-video","tagline":"Generate video from text and images using NVIDIA's 2B Cosmos Post-Trained 
Model","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-28","last_updated":"2026-05-11"},{"id":"fal-ai/cosmos-predict-2.5/text-to-video","name":"Cosmos Predict 2.5 2B","created_by":"fal","source":"official","description":"Generate video from text using NVIDIA's 2B Cosmos Post-Trained Model","status":"active","release_date":"2026-02-24","model_type":"video","page_url":"https://fal.run/fal-ai/cosmos-predict-2.5/text-to-video","tagline":"Generate video from text using NVIDIA's 2B Cosmos Post-Trained Model","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-28","last_updated":"2026-05-11"},{"id":"fal-ai/cosmos-predict-2.5/video-to-video","name":"Cosmos Predict 2.5 2B","created_by":"fal","source":"official","description":"Generate video from text and videos using NVIDIA's 2B Cosmos Post-Trained Model","status":"active","release_date":"2026-02-24","model_type":"other","page_url":"https://fal.run/fal-ai/cosmos-predict-2.5/video-to-video","tagline":"Generate video from text and videos using NVIDIA's 2B Cosmos Post-Trained Model","last_seen_at":"2026-02-24","last_updated":"2026-05-11"},{"id":"fal-ai/creatify/aurora","name":"Creatify Aurora","created_by":"fal","source":"official","description":"Generate high fidelity, studio quality videos of your avatar speaking or singing using the Aurora from Creatify team!","status":"active","release_date":"2025-12-11","model_type":"video","page_url":"https://fal.run/fal-ai/creatify/aurora","tagline":"Generate high fidelity, studio quality videos of your avatar speaking or singing using the Aurora from Creatify team!","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/creative-upscaler","name":"Creative Upscaler","created_by":"fal","source":"official","description":"Create 
creative upscaled images.","status":"active","release_date":"2024-02-27","model_type":"image","page_url":"https://fal.run/fal-ai/creative-upscaler","tagline":"Create creative upscaled images.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/csm-1b","name":"CSM-1B","created_by":"fal","source":"official","description":"CSM (Conversational Speech Model) is a speech generation model from Sesame that generates RVQ audio codes from text and audio inputs.","status":"active","release_date":"2025-03-13","model_type":"other","parameters":1,"page_url":"https://fal.run/fal-ai/csm-1b","tagline":"CSM (Conversational Speech Model) is a speech generation model from Sesame that generates RVQ audio codes from text and audio inputs.","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/davinci-magihuman","name":"Davinci Magihuman","created_by":"fal","source":"official","description":"Expressive facial performance, natural speech-expression coordination, realistic body motion, and accurate audio-video synchronization with DaVinci-MagiHuman model","status":"active","release_date":"2026-03-25","model_type":"video","page_url":"https://fal.run/fal-ai/davinci-magihuman","tagline":"Expressive facial performance, natural speech-expression coordination, realistic body motion, and accurate audio-video synchronization with DaVinci-MagiHuman model","capabilities":{"vision":true},"modalities":{"input":["text","image","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-28","last_updated":"2026-05-11"},{"id":"fal-ai/ddcolor","name":"DDColor","created_by":"fal","source":"official","description":"Bring colors into old or new black and white photos with DDColor.","status":"active","release_date":"2025-02-26","model_type":"image","page_url":"https://fal.run/fal-ai/ddcolor","tagline":"Bring colors into old or new black and white 
photos with DDColor.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/decart/lucy-5b/image-to-video","name":"Decart","created_by":"fal","source":"official","description":"Lucy-5B is a model that can create 5-second I2V videos in under 5 seconds, achieving >1x RTF end-to-end","status":"active","release_date":"2025-08-28","model_type":"video","page_url":"https://fal.run/fal-ai/decart/lucy-5b/image-to-video","tagline":"Lucy-5B is a model that can create 5-second I2V videos in under 5 seconds, achieving >1x RTF end-to-end","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/deepfilternet3","name":"DeepFilterNet 3","created_by":"fal","source":"official","description":"Enhance speech audio by removing background noise and upsampling to 48KHz","status":"active","release_date":"2026-01-07","model_type":"other","page_url":"https://fal.run/fal-ai/deepfilternet3","tagline":"Enhance speech audio by removing background noise and upsampling to 48KHz","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/demucs","name":"Demucs","created_by":"fal","source":"official","description":"SOTA stemming model for voice, drums, bass, guitar and more.","status":"active","release_date":"2025-10-27","model_type":"other","page_url":"https://fal.run/fal-ai/demucs","tagline":"SOTA stemming model for voice, drums, bass, guitar and more.","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/depth-anything-video","name":"Depth Anything Video","created_by":"fal","source":"official","description":"Generates depth maps from video using Video Depth Anything (CVPR 
2025).","status":"active","release_date":"2026-03-02","model_type":"other","page_url":"https://fal.run/fal-ai/depth-anything-video","tagline":"Generates depth maps from video using Video Depth Anything (CVPR 2025).","last_seen_at":"2026-03-02","last_updated":"2026-05-11"},{"id":"fal-ai/dia-tts/voice-clone","name":"Dia Tts","created_by":"fal","source":"official","description":"Clone dialog voices from a sample audio and generate dialogs from text prompts using the Dia TTS which leverages advanced AI techniques to create high-quality text-to-speech.","status":"active","release_date":"2025-04-22","model_type":"other","page_url":"https://fal.run/fal-ai/dia-tts/voice-clone","tagline":"Clone dialog voices from a sample audio and generate dialogs from text prompts using the Dia TTS which leverages advanced AI techniques to create high-quality text-to-speech.","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/dia-tts","name":"Dia","created_by":"fal","source":"official","description":"Dia directly generates realistic dialogue from transcripts.","status":"active","release_date":"2025-04-22","model_type":"tts","page_url":"https://fal.run/fal-ai/dia-tts","tagline":"Dia directly generates realistic dialogue from transcripts.","modalities":{"input":["text"],"output":["audio"]},"endpoints":["audio_speech"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/diffrhythm","name":"DiffRhythm: Lyrics to Song","created_by":"fal","source":"official","description":"DiffRhythm is a blazing fast model for transforming lyrics into full songs.","status":"active","release_date":"2025-03-04","model_type":"other","page_url":"https://fal.run/fal-ai/diffrhythm","tagline":"DiffRhythm is a blazing fast model for transforming lyrics into full songs.","last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/diffusion-edge","name":"DiffusionEdge","created_by":"fal","source":"official","description":"Diffusion based high quality edge 
detection","status":"active","release_date":"2024-01-08","model_type":"image","page_url":"https://fal.run/fal-ai/diffusion-edge","tagline":"Diffusion based high quality edge detection","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/docres/dewarp","name":"DocRes-dewarp","created_by":"fal","source":"official","description":"Enhance wraped, folded documents with the superior quality of docres for sharper, clearer results.","status":"active","release_date":"2025-03-03","model_type":"image","page_url":"https://fal.run/fal-ai/docres/dewarp","tagline":"Enhance wraped, folded documents with the superior quality of docres for sharper, clearer results.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/docres","name":"DocRes","created_by":"fal","source":"official","description":"Enhance low-resolution, blur, shadowed documents with the superior quality of docres for sharper, clearer results.","status":"active","release_date":"2025-03-03","model_type":"image","page_url":"https://fal.run/fal-ai/docres","tagline":"Enhance low-resolution, blur, shadowed documents with the superior quality of docres for sharper, clearer results.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/drct-super-resolution","name":"DRCT-Super-Resolution","created_by":"fal","source":"official","description":"Upscale your images with DRCT-Super-Resolution.","status":"active","release_date":"2025-02-24","model_type":"image","page_url":"https://fal.run/fal-ai/drct-super-resolution","tagline":"Upscale your images with 
DRCT-Super-Resolution.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/dreamo","name":"DreamO","created_by":"fal","source":"official","description":"DreamO is an image customization framework designed to support a wide range of tasks while facilitating seamless integration of multiple conditions.","status":"active","release_date":"2025-05-19","model_type":"image","page_url":"https://fal.run/fal-ai/dreamo","tagline":"DreamO is an image customization framework designed to support a wide range of tasks while facilitating seamless integration of multiple conditions.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/dreamomni2/edit","name":"DreamOmni2","created_by":"fal","source":"official","description":"DreamOmni2 is a unified multimodal model for text and image guided image editing.","status":"active","release_date":"2025-10-10","model_type":"image","page_url":"https://fal.run/fal-ai/dreamomni2/edit","tagline":"DreamOmni2 is a unified multimodal model for text and image guided image editing.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/dreamshaper","name":"Dreamshaper","created_by":"fal","source":"official","description":"Dreamshaper model.","status":"active","release_date":"2024-04-25","model_type":"image","page_url":"https://fal.run/fal-ai/dreamshaper","tagline":"Dreamshaper model.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/dubbing","name":"Dubbing","created_by":"fal","source":"official","description":"This endpoint delivers seamlessly 
localized videos by generating lip-synced dubs in multiple languages, ensuring natural and immersive multilingual experiences","status":"active","release_date":"2024-12-20","model_type":"other","page_url":"https://fal.run/fal-ai/dubbing","tagline":"This endpoint delivers seamlessly localized videos by generating lip-synced dubs in multiple languages, ensuring natural and immersive multilingual experiences","last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/dwpose/video","name":"DWPose Pose Prediction","created_by":"fal","source":"official","description":"Predict poses from videos.","status":"active","release_date":"2025-06-15","model_type":"other","page_url":"https://fal.run/fal-ai/dwpose/video","tagline":"Predict poses from videos.","last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/dwpose","name":"DWPose Pose Prediction","created_by":"fal","source":"official","description":"Predict poses from images.","status":"active","release_date":"2024-06-01","model_type":"image","page_url":"https://fal.run/fal-ai/dwpose","tagline":"Predict poses from images.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/echomimic-v3","name":"EchoMimic V3","created_by":"fal","source":"official","description":"EchoMimic V3 generates a talking avatar model from a picture, audio and text prompt.","status":"active","release_date":"2025-08-13","model_type":"other","page_url":"https://fal.run/fal-ai/echomimic-v3","tagline":"EchoMimic V3 generates a talking avatar model from a picture, audio and text prompt.","last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/editto","name":"Editto","created_by":"fal","source":"official","description":"Edit videos using instruction-based prompting using Editto 
model!","status":"active","release_date":"2025-11-12","model_type":"other","page_url":"https://fal.run/fal-ai/editto","tagline":"Edit videos using instruction-based prompting using Editto model!","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/elevenlabs/audio-isolation","name":"ElevenLabs Audio Isolation","created_by":"fal","source":"official","description":"Isolate audio tracks using ElevenLabs advanced audio isolation technology.","status":"active","release_date":"2025-02-27","model_type":"other","page_url":"https://fal.run/fal-ai/elevenlabs/audio-isolation","tagline":"Isolate audio tracks using ElevenLabs advanced audio isolation technology.","capabilities":{"streaming":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/elevenlabs/dubbing","name":"ElevenLabs Dubbing","created_by":"fal","source":"official","description":"Generate dubbed videos or audios using ElevenLabs Dubbing feature!","status":"active","release_date":"2026-01-14","model_type":"other","page_url":"https://fal.run/fal-ai/elevenlabs/dubbing","tagline":"Generate dubbed videos or audios using ElevenLabs Dubbing feature!","last_seen_at":"2026-05-27","last_updated":"2026-06-03"},{"id":"fal-ai/elevenlabs/music","name":"Elevenlabs Music","created_by":"fal","source":"official","description":"Generate high quality, realistic music with fine controls using Elevenlabs Music!","status":"active","release_date":"2025-12-22","model_type":"other","page_url":"https://fal.run/fal-ai/elevenlabs/music","tagline":"Generate high quality, realistic music with fine controls using Elevenlabs Music!","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/elevenlabs/sound-effects/v2","name":"Elevenlabs Sound Effects V2","created_by":"fal","source":"official","description":"Generate sound effects using ElevenLabs advanced sound effects 
model.","status":"active","release_date":"2025-09-02","model_type":"other","page_url":"https://fal.run/fal-ai/elevenlabs/sound-effects/v2","tagline":"Generate sound effects using ElevenLabs advanced sound effects model.","capabilities":{"streaming":true},"last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/elevenlabs/speech-to-text/scribe-v2","name":"ElevenLabs Speech to Text - Scribe V2","created_by":"fal","source":"official","description":"Use Scribe-V2 from ElevenLabs to do blazingly fast speech to text inferences!","status":"active","release_date":"2026-01-14","model_type":"transcription","page_url":"https://fal.run/fal-ai/elevenlabs/speech-to-text/scribe-v2","tagline":"Use Scribe-V2 from ElevenLabs to do blazingly fast speech to text inferences!","modalities":{"input":["audio"],"output":["text"]},"endpoints":["audio_transcriptions"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/elevenlabs/speech-to-text","name":"ElevenLabs Speech to Text","created_by":"fal","source":"official","description":"Generate text from speech using ElevenLabs advanced speech-to-text model.","status":"active","release_date":"2025-02-27","model_type":"transcription","page_url":"https://fal.run/fal-ai/elevenlabs/speech-to-text","tagline":"Generate text from speech using ElevenLabs advanced speech-to-text model.","modalities":{"input":["audio"],"output":["text"]},"endpoints":["audio_transcriptions"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/elevenlabs/text-to-dialogue/eleven-v3","name":"Elevenlabs","created_by":"fal","source":"official","description":"Generate realistic audio dialogues using Eleven-v3 from ElevenLabs.","status":"active","release_date":"2025-09-09","model_type":"other","page_url":"https://fal.run/fal-ai/elevenlabs/text-to-dialogue/eleven-v3","tagline":"Generate realistic audio dialogues using Eleven-v3 from 
ElevenLabs.","capabilities":{"streaming":true},"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/elevenlabs/tts/eleven-v3","name":"Elevenlabs Tts Eleven V3","created_by":"fal","source":"official","description":"Generate text-to-speech audio using Eleven-v3 from ElevenLabs.","status":"active","release_date":"2025-08-20","model_type":"other","page_url":"https://fal.run/fal-ai/elevenlabs/tts/eleven-v3","tagline":"Generate text-to-speech audio using Eleven-v3 from ElevenLabs.","capabilities":{"streaming":true},"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/elevenlabs/tts/multilingual-v2","name":"ElevenLabs TTS Multilingual v2","created_by":"fal","source":"official","description":"Generate multilingual text-to-speech audio using ElevenLabs TTS Multilingual v2.","status":"active","release_date":"2025-02-27","model_type":"other","page_url":"https://fal.run/fal-ai/elevenlabs/tts/multilingual-v2","tagline":"Generate multilingual text-to-speech audio using ElevenLabs TTS Multilingual v2.","capabilities":{"streaming":true},"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/elevenlabs/tts/turbo-v2.5","name":"ElevenLabs TTS Turbo v2.5","created_by":"fal","source":"official","description":"Generate high-speed text-to-speech audio using ElevenLabs TTS Turbo v2.5.","status":"active","release_date":"2025-02-27","model_type":"tts","page_url":"https://fal.run/fal-ai/elevenlabs/tts/turbo-v2.5","tagline":"Generate high-speed text-to-speech audio using ElevenLabs TTS Turbo v2.5.","capabilities":{"streaming":true},"modalities":{"input":["text"],"output":["audio"]},"endpoints":["audio_speech"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/elevenlabs/voice-changer","name":"ElevenLabs Voice Changer","created_by":"fal","source":"official","description":"Change the voices in your audios with voices in 
ElevenLabs!","status":"active","release_date":"2026-01-14","model_type":"other","page_url":"https://fal.run/fal-ai/elevenlabs/voice-changer","tagline":"Change the voices in your audios with voices in ElevenLabs!","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/emu-3.5-image/edit-image","name":"Emu 3.5 Image","created_by":"fal","source":"official","description":"Edit images with a text prompt using Emu 3.5 Image","status":"active","release_date":"2025-11-01","model_type":"image","page_url":"https://fal.run/fal-ai/emu-3.5-image/edit-image","tagline":"Edit images with a text prompt using Emu 3.5 Image","capabilities":{"streaming":true,"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/emu-3.5-image/text-to-image","name":"Emu 3.5 Image","created_by":"fal","source":"official","description":"Generate images from text using Emu 3.5 Image","status":"active","release_date":"2025-11-01","model_type":"image","page_url":"https://fal.run/fal-ai/emu-3.5-image/text-to-image","tagline":"Generate images from text using Emu 3.5 Image","capabilities":{"streaming":true,"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/era-3d","name":"Era 3D","created_by":"fal","source":"official","description":"A powerful image to novel multiview model with normals.","status":"active","release_date":"2024-07-01","model_type":"image","page_url":"https://fal.run/fal-ai/era-3d","tagline":"A powerful image to novel multiview model with normals.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/ernie-image/lora/turbo","name":"Ernie Image Lora Turbo","created_by":"fal","source":"official","description":"High-quality text-to-image 
model by Baidu.","status":"active","release_date":"2026-04-16","model_type":"image","page_url":"https://fal.run/fal-ai/ernie-image/lora/turbo","tagline":"High-quality text-to-image model by Baidu.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/ernie-image/lora","name":"Ernie Image Lora","created_by":"fal","source":"official","description":"High-quality text-to-image model by Baidu.","status":"active","release_date":"2026-04-16","model_type":"image","page_url":"https://fal.run/fal-ai/ernie-image/lora","tagline":"High-quality text-to-image model by Baidu.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/ernie-image-trainer","name":"ERNIE-Image Trainer","created_by":"fal","source":"official","description":"LoRA trainer for ERNIE-Image, Baidu's powerful 8B-parameter text-to-image model.","status":"active","release_date":"2026-04-15","model_type":"other","page_url":"https://fal.run/fal-ai/ernie-image-trainer","tagline":"LoRA trainer for ERNIE-Image, Baidu's powerful 8B-parameter text-to-image model.","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/ernie-image/turbo","name":"Ernie Image Turbo","created_by":"fal","source":"official","description":"High-quality text-to-image model by Baidu.","status":"active","release_date":"2026-04-13","model_type":"image","page_url":"https://fal.run/fal-ai/ernie-image/turbo","tagline":"High-quality text-to-image model by Baidu.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/ernie-image","name":"Ernie Image","created_by":"fal","source":"official","description":"High-quality text-to-image model by 
Baidu.","status":"active","release_date":"2026-04-10","model_type":"image","page_url":"https://fal.run/fal-ai/ernie-image","tagline":"High-quality text-to-image model by Baidu.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-05-16","last_updated":"2026-06-03"},{"id":"fal-ai/esrgan","name":"Upscale Images","created_by":"fal","source":"official","description":"Upscale images by a given factor.","status":"active","release_date":"2023-10-30","model_type":"image","page_url":"https://fal.run/fal-ai/esrgan","tagline":"Upscale images by a given factor.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/evf-sam","name":"EVF-SAM2 Segmentation","created_by":"fal","source":"official","description":"EVF-SAM2 combines natural language understanding with advanced segmentation capabilities, allowing you to precisely mask image regions using intuitive positive and negative text prompts.","status":"active","release_date":"2025-02-26","model_type":"image","page_url":"https://fal.run/fal-ai/evf-sam","tagline":"EVF-SAM2 combines natural language understanding with advanced segmentation capabilities, allowing you to precisely mask image regions using intuitive positive and negative text prompts.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/f-lite/standard","name":"F Lite","created_by":"fal","source":"official","description":"F Lite is a 10B parameter diffusion model created by Fal and Freepik, trained exclusively on copyright-safe and SFW content.","status":"active","release_date":"2025-04-28","model_type":"image","page_url":"https://fal.run/fal-ai/f-lite/standard","tagline":"F Lite is a 10B parameter diffusion model created by Fal and 
Freepik, trained exclusively on copyright-safe and SFW content.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/f-lite/texture","name":"F Lite (texture mode)","created_by":"fal","source":"official","description":"F Lite is a 10B parameter diffusion model created by Fal and Freepik, trained exclusively on copyright-safe and SFW content.","status":"active","release_date":"2025-04-28","model_type":"image","page_url":"https://fal.run/fal-ai/f-lite/texture","tagline":"F Lite is a 10B parameter diffusion model created by Fal and Freepik, trained exclusively on copyright-safe and SFW content.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/f5-tts","name":"F5 TTS","created_by":"fal","source":"official","description":"F5 TTS","status":"active","release_date":"2024-10-17","model_type":"other","page_url":"https://fal.run/fal-ai/f5-tts","tagline":"F5 TTS","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/face-to-sticker","name":"Face to Sticker","created_by":"fal","source":"official","description":"Create stickers from faces.","status":"active","release_date":"2024-03-11","model_type":"image","page_url":"https://fal.run/fal-ai/face-to-sticker","tagline":"Create stickers from faces.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/fashn/tryon/v1.5","name":"FASHN Virtual Try-On V1.5","created_by":"fal","source":"official","description":"FASHN v1.5 delivers precise virtual try-on capabilities, accurately rendering garment details like text and patterns at 576x864 resolution from both on-model and flat-lay photo 
references.","status":"active","release_date":"2025-04-21","model_type":"image","page_url":"https://fal.run/fal-ai/fashn/tryon/v1.5","tagline":"FASHN v1.5 delivers precise virtual try-on capabilities, accurately rendering garment details like text and patterns at 576x864 resolution from both on-model and flat-lay photo references.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/fashn/tryon/v1.6","name":"FASHN Virtual Try-On V1.6","created_by":"fal","source":"official","description":"FASHN v1.6 delivers precise virtual try-on capabilities, accurately rendering garment details like text and patterns at 864x1296 resolution from both on-model and flat-lay photo references.","status":"active","release_date":"2025-06-24","model_type":"image","page_url":"https://fal.run/fal-ai/fashn/tryon/v1.6","tagline":"FASHN v1.6 delivers precise virtual try-on capabilities, accurately rendering garment details like text and patterns at 864x1296 resolution from both on-model and flat-lay photo references.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/fast-animatediff/text-to-video","name":"AnimateDiff","created_by":"fal","source":"official","description":"Animate your ideas!","status":"active","release_date":"2024-02-21","model_type":"video","page_url":"https://fal.run/fal-ai/fast-animatediff/text-to-video","tagline":"Animate your ideas!","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/fast-animatediff/turbo/text-to-video","name":"AnimateDiff Turbo","created_by":"fal","source":"official","description":"Animate your ideas in lightning 
speed!","status":"active","release_date":"2024-02-13","model_type":"video","page_url":"https://fal.run/fal-ai/fast-animatediff/turbo/text-to-video","tagline":"Animate your ideas in lightning speed!","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/fast-animatediff/turbo/video-to-video","name":"AnimateDiff Turbo","created_by":"fal","source":"official","description":"Re-animate your videos in lightning speed!","status":"active","release_date":"2024-02-13","model_type":"other","page_url":"https://fal.run/fal-ai/fast-animatediff/turbo/video-to-video","tagline":"Re-animate your videos in lightning speed!","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/fast-animatediff/video-to-video","name":"AnimateDiff","created_by":"fal","source":"official","description":"Re-animate your videos!","status":"active","release_date":"2024-02-13","model_type":"other","page_url":"https://fal.run/fal-ai/fast-animatediff/video-to-video","tagline":"Re-animate your videos!","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/fast-fooocus-sdxl/image-to-image","name":"Fooocus","created_by":"fal","source":"official","description":"Fooocus extreme speed mode as a standalone app.","status":"active","release_date":"2024-03-13","model_type":"image","page_url":"https://fal.run/fal-ai/fast-fooocus-sdxl/image-to-image","tagline":"Fooocus extreme speed mode as a standalone app.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/fast-fooocus-sdxl","name":"Fooocus","created_by":"fal","source":"official","description":"Fooocus extreme speed mode as a standalone app.","status":"active","release_date":"2024-02-16","model_type":"image","page_url":"https://fal.run/fal-ai/fast-fooocus-sdxl","tagline":"Fooocus extreme speed mode as a standalone 
app.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/fast-lcm-diffusion/image-to-image","name":"Latent Consistency Models (v1.5/XL)","created_by":"fal","source":"official","description":"Run SDXL at the speed of light","status":"active","release_date":"2024-02-19","model_type":"image","page_url":"https://fal.run/fal-ai/fast-lcm-diffusion/image-to-image","tagline":"Run SDXL at the speed of light","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/fast-lcm-diffusion/inpainting","name":"Latent Consistency Models (v1.5/XL)","created_by":"fal","source":"official","description":"Run SDXL at the speed of light","status":"active","release_date":"2024-02-19","model_type":"image","page_url":"https://fal.run/fal-ai/fast-lcm-diffusion/inpainting","tagline":"Run SDXL at the speed of light","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/fast-lcm-diffusion","name":"Latent Consistency Models (v1.5/XL)","created_by":"fal","source":"official","description":"Run SDXL at the speed of light","status":"active","release_date":"2024-02-19","model_type":"image","page_url":"https://fal.run/fal-ai/fast-lcm-diffusion","tagline":"Run SDXL at the speed of light","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/fast-lightning-sdxl/image-to-image","name":"Stable Diffusion XL Lightning","created_by":"fal","source":"official","description":"Run SDXL at the speed of 
light","status":"active","release_date":"2024-02-21","model_type":"image","page_url":"https://fal.run/fal-ai/fast-lightning-sdxl/image-to-image","tagline":"Run SDXL at the speed of light","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/fast-lightning-sdxl/inpainting","name":"Stable Diffusion XL Lightning","created_by":"fal","source":"official","description":"Run SDXL at the speed of light","status":"active","release_date":"2024-02-21","model_type":"image","page_url":"https://fal.run/fal-ai/fast-lightning-sdxl/inpainting","tagline":"Run SDXL at the speed of light","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/fast-lightning-sdxl","name":"Stable Diffusion XL Lightning","created_by":"fal","source":"official","description":"Run SDXL at the speed of light","status":"active","release_date":"2024-04-11","model_type":"image","page_url":"https://fal.run/fal-ai/fast-lightning-sdxl","tagline":"Run SDXL at the speed of light","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/fast-sdxl-controlnet-canny/image-to-image","name":"ControlNet SDXL","created_by":"fal","source":"official","description":"Generate Images with ControlNet.","status":"active","release_date":"2023-12-01","model_type":"image","page_url":"https://fal.run/fal-ai/fast-sdxl-controlnet-canny/image-to-image","tagline":"Generate Images with ControlNet.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/fast-sdxl-controlnet-canny/inpainting","name":"ControlNet 
SDXL","created_by":"fal","source":"official","description":"Generate Images with ControlNet.","status":"active","release_date":"2023-12-01","model_type":"image","page_url":"https://fal.run/fal-ai/fast-sdxl-controlnet-canny/inpainting","tagline":"Generate Images with ControlNet.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/fast-sdxl-controlnet-canny","name":"ControlNet SDXL","created_by":"fal","source":"official","description":"Generate Images with ControlNet.","status":"active","release_date":"2024-02-28","model_type":"image","page_url":"https://fal.run/fal-ai/fast-sdxl-controlnet-canny","tagline":"Generate Images with ControlNet.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/fast-sdxl/image-to-image","name":"Stable Diffusion XL","created_by":"fal","source":"official","description":"Run SDXL at the speed of light","status":"active","release_date":"2024-04-16","model_type":"image","page_url":"https://fal.run/fal-ai/fast-sdxl/image-to-image","tagline":"Run SDXL at the speed of light","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/fast-sdxl/inpainting","name":"Stable Diffusion XL","created_by":"fal","source":"official","description":"Run SDXL at the speed of light","status":"active","release_date":"2024-04-16","model_type":"image","page_url":"https://fal.run/fal-ai/fast-sdxl/inpainting","tagline":"Run SDXL at the speed of light","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/fast-sdxl","name":"Stable Diffusion 
XL","created_by":"fal","source":"official","description":"Run SDXL at the speed of light","status":"active","release_date":"2024-06-12","model_type":"image","page_url":"https://fal.run/fal-ai/fast-sdxl","tagline":"Run SDXL at the speed of light","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/fast-svd-lcm/text-to-video","name":"Stable Video Diffusion Turbo","created_by":"fal","source":"official","description":"Generate short video clips from your images using SVD v1.1 at Lightning Speed","status":"active","release_date":"2024-06-03","model_type":"video","page_url":"https://fal.run/fal-ai/fast-svd-lcm/text-to-video","tagline":"Generate short video clips from your images using SVD v1.1 at Lightning Speed","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/fast-svd-lcm","name":"Stable Video Diffusion Turbo","created_by":"fal","source":"official","description":"Generate short video clips from your images using SVD v1.1 at Lightning Speed","status":"active","release_date":"2024-02-13","model_type":"video","page_url":"https://fal.run/fal-ai/fast-svd-lcm","tagline":"Generate short video clips from your images using SVD v1.1 at Lightning Speed","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/fast-svd/text-to-video","name":"Stable Video Diffusion","created_by":"fal","source":"official","description":"Generate short video clips from your prompts using SVD v1.1","status":"active","release_date":"2024-09-16","model_type":"video","page_url":"https://fal.run/fal-ai/fast-svd/text-to-video","tagline":"Generate short video clips from your prompts using SVD 
v1.1","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/ffmpeg-api/compose","name":"FFmpeg API Compose","created_by":"fal","source":"official","description":"Compose videos from multiple media sources using FFmpeg API.","status":"active","release_date":"2025-01-22","model_type":"other","page_url":"https://fal.run/fal-ai/ffmpeg-api/compose","tagline":"Compose videos from multiple media sources using FFmpeg API.","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/ffmpeg-api/extract-frame","name":"Ffmpeg Api","created_by":"fal","source":"official","description":"ffmpeg endpoint for first, middle and last frame extraction from videos","status":"active","release_date":"2025-06-09","model_type":"image","page_url":"https://fal.run/fal-ai/ffmpeg-api/extract-frame","tagline":"ffmpeg endpoint for first, middle and last frame extraction from videos","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/ffmpeg-api/images-to-video","name":"Ffmpeg Api Images to Video","created_by":"fal","source":"official","description":"A fal.ai endpoint that stitches an ordered list of images into an MP4 video by holding each image for a specified number of frames at a configurable frame rate","status":"active","release_date":"2026-05-05","model_type":"video","page_url":"https://fal.run/fal-ai/ffmpeg-api/images-to-video","tagline":"A fal.ai endpoint that stitches an ordered list of images into an MP4 video by holding each image for a specified number of frames at a configurable frame rate","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-05-05","last_updated":"2026-05-11"},{"id":"fal-ai/ffmpeg-api/loudnorm","name":"Ffmpeg 
Api","created_by":"fal","source":"official","description":"Get EBU R128 loudness normalization from audio files using FFmpeg API.","status":"active","release_date":"2025-07-08","model_type":"other","page_url":"https://fal.run/fal-ai/ffmpeg-api/loudnorm","tagline":"Get EBU R128 loudness normalization from audio files using FFmpeg API.","capabilities":{"structured_output":true,"json_mode":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/ffmpeg-api/merge-audio-video","name":"Ffmpeg Api Merge Audio-Video","created_by":"fal","source":"official","description":"Merge videos with standalone audio files or audio from video files.","status":"active","release_date":"2025-06-09","model_type":"other","page_url":"https://fal.run/fal-ai/ffmpeg-api/merge-audio-video","tagline":"Merge videos with standalone audio files or audio from video files.","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/ffmpeg-api/merge-audios","name":"FFmpeg API [Merge Audios]","created_by":"fal","source":"official","description":"Merge audios into a single audio using FFmpeg API!","status":"active","release_date":"2025-12-23","model_type":"other","page_url":"https://fal.run/fal-ai/ffmpeg-api/merge-audios","tagline":"Merge audios into a single audio using FFmpeg API!","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/ffmpeg-api/merge-videos","name":"Ffmpeg Api","created_by":"fal","source":"official","description":"Use ffmpeg capabilities to merge 2 or more videos.","status":"active","release_date":"2025-08-12","model_type":"other","page_url":"https://fal.run/fal-ai/ffmpeg-api/merge-videos","tagline":"Use ffmpeg capabilities to merge 2 or more videos.","last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/ffmpeg-api/metadata","name":"FFmpeg API Metadata","created_by":"fal","source":"official","description":"Get encoding metadata from video and audio files using FFmpeg 
API.","status":"active","release_date":"2025-01-22","model_type":"other","page_url":"https://fal.run/fal-ai/ffmpeg-api/metadata","tagline":"Get encoding metadata from video and audio files using FFmpeg API.","capabilities":{"structured_output":true,"json_mode":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/ffmpeg-api/waveform","name":"FFmpeg API Waveform","created_by":"fal","source":"official","description":"Get waveform data from audio files using FFmpeg API.","status":"active","release_date":"2025-01-22","model_type":"other","page_url":"https://fal.run/fal-ai/ffmpeg-api/waveform","tagline":"Get waveform data from audio files using FFmpeg API.","capabilities":{"structured_output":true,"json_mode":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/film/video","name":"FILM","created_by":"fal","source":"official","description":"Interpolate videos with FILM - Frame Interpolation for Large Motion","status":"active","release_date":"2025-07-22","model_type":"other","page_url":"https://fal.run/fal-ai/film/video","tagline":"Interpolate videos with FILM - Frame Interpolation for Large Motion","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/film","name":"FILM","created_by":"fal","source":"official","description":"Interpolate images with FILM - Frame Interpolation for Large Motion","status":"active","release_date":"2025-07-22","model_type":"image","page_url":"https://fal.run/fal-ai/film","tagline":"Interpolate images with FILM - Frame Interpolation for Large Motion","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/finegrain-eraser/bbox","name":"Finegrain Eraser Bbox","created_by":"fal","source":"official","description":"Finegrain Eraser removes any object selected with a bounding box—along with its shadows, reflections, and lighting artifacts—seamlessly 
reconstructing the scene with contextually accurate content.","status":"active","release_date":"2025-04-09","model_type":"image","page_url":"https://fal.run/fal-ai/finegrain-eraser/bbox","tagline":"Finegrain Eraser removes any object selected with a bounding box—along with its shadows, reflections, and lighting artifacts—seamlessly reconstructing the scene with contextually accurate content.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/finegrain-eraser/mask","name":"Finegrain Eraser Mask","created_by":"fal","source":"official","description":"Finegrain Eraser removes any object selected with a mask—along with its shadows, reflections, and lighting artifacts—seamlessly reconstructing the scene with contextually accurate content.","status":"active","release_date":"2025-04-10","model_type":"image","page_url":"https://fal.run/fal-ai/finegrain-eraser/mask","tagline":"Finegrain Eraser removes any object selected with a mask—along with its shadows, reflections, and lighting artifacts—seamlessly reconstructing the scene with contextually accurate content.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/finegrain-eraser","name":"Finegrain Eraser","created_by":"fal","source":"official","description":"Finegrain Eraser removes objects—along with their shadows, reflections, and lighting artifacts—using only natural language, seamlessly filling the scene with contextually accurate content.","status":"active","release_date":"2025-04-09","model_type":"image","page_url":"https://fal.run/fal-ai/finegrain-eraser","tagline":"Finegrain Eraser removes objects—along with their shadows, reflections, and lighting artifacts—using only natural language, seamlessly filling the scene with contextually accurate 
content.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/firered-image-edit-v1.1","name":"Firered Image Edit V1.1","created_by":"fal","source":"official","description":"FireRed Image Edit v1.1 is an updated version of FireRed Image Edit, with improved image editing capabilities.","status":"active","release_date":"2026-03-05","model_type":"image","page_url":"https://fal.run/fal-ai/firered-image-edit-v1.1","tagline":"FireRed Image Edit v1.1 is an updated version of FireRed Image Edit, with improved image editing capabilities.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-03-05","last_updated":"2026-05-11"},{"id":"fal-ai/firered-image-edit","name":"Firered Image Edit","created_by":"fal","source":"official","description":"FireRed Image Edit is FireRed's state of the art open source editing model, re-trained from Qwen Image Edit 2509.","status":"active","release_date":"2026-02-19","model_type":"image","page_url":"https://fal.run/fal-ai/firered-image-edit","tagline":"FireRed Image Edit is FireRed's state of the art open source editing model, re-trained from Qwen Image Edit 2509.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-10","last_updated":"2026-06-18"},{"id":"fal-ai/flashhead","name":"Flashhead","created_by":"fal","source":"official","description":"SoulX-FlashHead is a unified 1.3B-parameter framework designed for high-fidelity, infinite-length, and real-time streaming portrait video generation.","status":"active","release_date":"2026-03-12","model_type":"video","page_url":"https://fal.run/fal-ai/flashhead","tagline":"SoulX-FlashHead is a unified 1.3B-parameter framework designed for high-fidelity, infinite-length, and real-time streaming portrait video 
generation.","capabilities":{"streaming":true,"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-05-07","last_updated":"2026-05-11"},{"id":"fal-ai/flashtalk","name":"Flashtalk","created_by":"fal","source":"official","description":"Audio-driven talking avatar generation powered by the SoulX-FlashTalk 14B model.","status":"active","release_date":"2026-03-12","model_type":"other","page_url":"https://fal.run/fal-ai/flashtalk","tagline":"Audio-driven talking avatar generation powered by the SoulX-FlashTalk 14B model.","last_seen_at":"2026-05-07","last_updated":"2026-05-11"},{"id":"fal-ai/flashvsr/upscale/video","name":"Flashvsr","created_by":"fal","source":"official","description":"Upscale your videos using FlashVSR with the fastest speeds!","status":"active","release_date":"2025-11-11","model_type":"other","page_url":"https://fal.run/fal-ai/flashvsr/upscale/video","tagline":"Upscale your videos using FlashVSR with the fastest speeds!","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/florence-2-large/caption-to-phrase-grounding","name":"Florence-2 Large","created_by":"fal","source":"official","description":"Florence-2 is an advanced vision foundation model that uses a prompt-based approach to handle a wide range of vision and vision-language tasks","status":"active","release_date":"2024-06-22","model_type":"image","page_url":"https://fal.run/fal-ai/florence-2-large/caption-to-phrase-grounding","tagline":"Florence-2 is an advanced vision foundation model that uses a prompt-based approach to handle a wide range of vision and vision-language tasks","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/florence-2-large/caption","name":"Florence 2 Large Caption","created_by":"fal","source":"official","description":"Florence-2 is an advanced vision foundation 
model that uses a prompt-based approach to handle a wide range of vision and vision-language tasks","status":"active","release_date":"2024-06-22","model_type":"other","page_url":"https://fal.run/fal-ai/florence-2-large/caption","tagline":"Florence-2 is an advanced vision foundation model that uses a prompt-based approach to handle a wide range of vision and vision-language tasks","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/florence-2-large/dense-region-caption","name":"Florence-2 Large","created_by":"fal","source":"official","description":"Florence-2 is an advanced vision foundation model that uses a prompt-based approach to handle a wide range of vision and vision-language tasks","status":"active","release_date":"2024-06-22","model_type":"image","page_url":"https://fal.run/fal-ai/florence-2-large/dense-region-caption","tagline":"Florence-2 is an advanced vision foundation model that uses a prompt-based approach to handle a wide range of vision and vision-language tasks","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/florence-2-large/detailed-caption","name":"Florence 2 Large Detailed Caption","created_by":"fal","source":"official","description":"Florence-2 is an advanced vision foundation model that uses a prompt-based approach to handle a wide range of vision and vision-language tasks","status":"active","release_date":"2024-06-22","model_type":"other","page_url":"https://fal.run/fal-ai/florence-2-large/detailed-caption","tagline":"Florence-2 is an advanced vision foundation model that uses a prompt-based approach to handle a wide range of vision and vision-language tasks","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/florence-2-large/more-detailed-caption","name":"Florence-2 
Large","created_by":"fal","source":"official","description":"Florence-2 is an advanced vision foundation model that uses a prompt-based approach to handle a wide range of vision and vision-language tasks","status":"active","release_date":"2024-06-22","model_type":"other","page_url":"https://fal.run/fal-ai/florence-2-large/more-detailed-caption","tagline":"Florence-2 is an advanced vision foundation model that uses a prompt-based approach to handle a wide range of vision and vision-language tasks","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/florence-2-large/object-detection","name":"Florence-2 Large","created_by":"fal","source":"official","description":"Florence-2 is an advanced vision foundation model that uses a prompt-based approach to handle a wide range of vision and vision-language tasks","status":"active","release_date":"2024-06-22","model_type":"image","page_url":"https://fal.run/fal-ai/florence-2-large/object-detection","tagline":"Florence-2 is an advanced vision foundation model that uses a prompt-based approach to handle a wide range of vision and vision-language tasks","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/florence-2-large/ocr-with-region","name":"Florence-2 Large","created_by":"fal","source":"official","description":"Florence-2 is an advanced vision foundation model that uses a prompt-based approach to handle a wide range of vision and vision-language tasks","status":"active","release_date":"2024-06-22","model_type":"image","page_url":"https://fal.run/fal-ai/florence-2-large/ocr-with-region","tagline":"Florence-2 is an advanced vision foundation model that uses a prompt-based approach to handle a wide range of vision and vision-language 
tasks","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/florence-2-large/ocr","name":"Florence 2 Large OCR","created_by":"fal","source":"official","description":"Florence-2 is an advanced vision foundation model that uses a prompt-based approach to handle a wide range of vision and vision-language tasks","status":"active","release_date":"2024-06-22","model_type":"other","page_url":"https://fal.run/fal-ai/florence-2-large/ocr","tagline":"Florence-2 is an advanced vision foundation model that uses a prompt-based approach to handle a wide range of vision and vision-language tasks","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/florence-2-large/open-vocabulary-detection","name":"Florence-2 Large","created_by":"fal","source":"official","description":"Florence-2 is an advanced vision foundation model that uses a prompt-based approach to handle a wide range of vision and vision-language tasks","status":"active","release_date":"2024-06-22","model_type":"image","page_url":"https://fal.run/fal-ai/florence-2-large/open-vocabulary-detection","tagline":"Florence-2 is an advanced vision foundation model that uses a prompt-based approach to handle a wide range of vision and vision-language tasks","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/florence-2-large/referring-expression-segmentation","name":"Florence-2 Large","created_by":"fal","source":"official","description":"Florence-2 is an advanced vision foundation model that uses a prompt-based approach to handle a wide range of vision and vision-language 
tasks","status":"active","release_date":"2024-06-22","model_type":"image","page_url":"https://fal.run/fal-ai/florence-2-large/referring-expression-segmentation","tagline":"Florence-2 is an advanced vision foundation model that uses a prompt-based approach to handle a wide range of vision and vision-language tasks","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/florence-2-large/region-proposal","name":"Florence-2 Large","created_by":"fal","source":"official","description":"Florence-2 is an advanced vision foundation model that uses a prompt-based approach to handle a wide range of vision and vision-language tasks","status":"active","release_date":"2024-06-22","model_type":"image","page_url":"https://fal.run/fal-ai/florence-2-large/region-proposal","tagline":"Florence-2 is an advanced vision foundation model that uses a prompt-based approach to handle a wide range of vision and vision-language tasks","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/florence-2-large/region-to-category","name":"Florence 2 Large Region To Category","created_by":"fal","source":"official","description":"Florence-2 is an advanced vision foundation model that uses a prompt-based approach to handle a wide range of vision and vision-language tasks","status":"active","release_date":"2024-06-22","model_type":"other","page_url":"https://fal.run/fal-ai/florence-2-large/region-to-category","tagline":"Florence-2 is an advanced vision foundation model that uses a prompt-based approach to handle a wide range of vision and vision-language tasks","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/florence-2-large/region-to-description","name":"Florence-2 
Large","created_by":"fal","source":"official","description":"Florence-2 is an advanced vision foundation model that uses a prompt-based approach to handle a wide range of vision and vision-language tasks","status":"active","release_date":"2024-06-22","model_type":"other","page_url":"https://fal.run/fal-ai/florence-2-large/region-to-description","tagline":"Florence-2 is an advanced vision foundation model that uses a prompt-based approach to handle a wide range of vision and vision-language tasks","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/florence-2-large/region-to-segmentation","name":"Florence-2 Large","created_by":"fal","source":"official","description":"Florence-2 is an advanced vision foundation model that uses a prompt-based approach to handle a wide range of vision and vision-language tasks","status":"active","release_date":"2024-06-22","model_type":"image","page_url":"https://fal.run/fal-ai/florence-2-large/region-to-segmentation","tagline":"Florence-2 is an advanced vision foundation model that uses a prompt-based approach to handle a wide range of vision and vision-language tasks","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/flowedit","name":"Flow-Edit","created_by":"fal","source":"official","description":"The model provides you high quality image editing capabilities.","status":"active","release_date":"2025-02-14","model_type":"image","page_url":"https://fal.run/fal-ai/flowedit","tagline":"The model provides you high quality image editing capabilities.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/flux-1/dev/image-to-image","name":"FLUX.1 [dev]","created_by":"fal","source":"official","description":"FLUX.1 [dev] is a 12 
billion parameter flow transformer that generates high-quality images from text.","status":"active","release_date":"2025-06-02","model_type":"image","page_url":"https://fal.run/fal-ai/flux-1/dev/image-to-image","tagline":"FLUX.1 [dev] is a 12 billion parameter flow transformer that generates high-quality images from text.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/flux-1/dev/redux","name":"FLUX.1 [dev] Redux","created_by":"fal","source":"official","description":"FLUX.1 [dev] Redux is a high-performance endpoint for the FLUX.1 [dev] model that enables rapid transformation of existing images, delivering high-quality style transfers and image modifications with ","status":"active","release_date":"2025-06-02","model_type":"image","page_url":"https://fal.run/fal-ai/flux-1/dev/redux","tagline":"FLUX.1 [dev] Redux is a high-performance endpoint for the FLUX.1 [dev] model that enables rapid transformation of existing images, delivering high-quality style transfers and image modifications with ","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/flux-1/dev","name":"FLUX.1 [dev]","created_by":"fal","source":"official","description":"FLUX.1 [dev] is a 12 billion parameter flow transformer that generates high-quality images from text.","status":"active","release_date":"2025-06-02","model_type":"image","page_url":"https://fal.run/fal-ai/flux-1/dev","tagline":"FLUX.1 [dev] is a 12 billion parameter flow transformer that generates high-quality images from text.","capabilities":{"streaming":true,"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/flux-1/krea/image-to-image","name":"FLUX.1 Krea 
[dev]","created_by":"fal","source":"official","description":"FLUX.1 Krea [dev] is a 12 billion parameter flow transformer that generates high-quality images from text with incredible aesthetics.","status":"active","release_date":"2025-07-30","model_type":"image","page_url":"https://fal.run/fal-ai/flux-1/krea/image-to-image","tagline":"FLUX.1 Krea [dev] is a 12 billion parameter flow transformer that generates high-quality images from text with incredible aesthetics.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/flux-1/krea/redux","name":"FLUX.1 Krea [dev] Redux","created_by":"fal","source":"official","description":"FLUX.1 Krea [dev] Redux is a high-performance endpoint for the FLUX.1 Krea [dev] model that enables rapid transformation of existing images, delivering high-quality style transfers and image modificat","status":"active","release_date":"2025-07-30","model_type":"image","page_url":"https://fal.run/fal-ai/flux-1/krea/redux","tagline":"FLUX.1 Krea [dev] Redux is a high-performance endpoint for the FLUX.1 Krea [dev] model that enables rapid transformation of existing images, delivering high-quality style transfers and image modificat","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/flux-1/krea","name":"FLUX.1 Krea [dev]","created_by":"fal","source":"official","description":"FLUX.1 Krea [dev] is a 12 billion parameter flow transformer that generates high-quality images from text with incredible aesthetics.","status":"active","release_date":"2025-07-30","model_type":"image","page_url":"https://fal.run/fal-ai/flux-1/krea","tagline":"FLUX.1 Krea [dev] is a 12 billion parameter flow transformer that generates high-quality images from text with incredible 
aesthetics.","capabilities":{"streaming":true,"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/flux-1/schnell/redux","name":"FLUX.1 [schnell] Redux","created_by":"fal","source":"official","description":"FLUX.1 [schnell] Redux is a high-performance endpoint for the FLUX.1 [schnell] model that enables rapid transformation of existing images, delivering high-quality style transfers and image modifications with the core FLUX capabilities.","status":"active","release_date":"2025-06-02","model_type":"image","page_url":"https://fal.run/fal-ai/flux-1/schnell/redux","tagline":"FLUX.1 [schnell] Redux is a high-performance endpoint for the FLUX.1 [schnell] model that enables rapid transformation of existing images, delivering high-quality style transfers and image modificatio","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/flux-1/schnell","name":"FLUX.1 [schnell]","created_by":"fal","source":"official","description":"Fastest inference in the world for the 12 billion parameter FLUX.1 [schnell] text-to-image model.","status":"active","release_date":"2025-06-02","model_type":"image","page_url":"https://fal.run/fal-ai/flux-1/schnell","tagline":"Fastest inference in the world for the 12 billion parameter FLUX.1 [schnell] text-to-image model.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-05-19","last_updated":"2026-06-03"},{"id":"fal-ai/flux-1/srpo/image-to-image","name":"FLUX.1 SRPO [dev]","created_by":"fal","source":"official","description":"FLUX.1 SRPO [dev] is a 12 billion parameter flow transformer that generates high-quality images from text with incredible 
aesthetics.","status":"active","release_date":"2025-09-15","model_type":"image","page_url":"https://fal.run/fal-ai/flux-1/srpo/image-to-image","tagline":"FLUX.1 SRPO [dev] is a 12 billion parameter flow transformer that generates high-quality images from text with incredible aesthetics.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/flux-1/srpo","name":"FLUX.1 SRPO [dev]","created_by":"fal","source":"official","description":"FLUX.1 SRPO [dev] is a 12 billion parameter flow transformer that generates high-quality images from text with incredible aesthetics.","status":"active","release_date":"2025-09-15","model_type":"image","page_url":"https://fal.run/fal-ai/flux-1/srpo","tagline":"FLUX.1 SRPO [dev] is a 12 billion parameter flow transformer that generates high-quality images from text with incredible aesthetics.","capabilities":{"streaming":true,"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/flux-2/edit","name":"FLUX 2 Edit","created_by":"fal","source":"official","description":"Image-to-image editing with FLUX.2 [dev] from Black Forest Labs.","status":"active","release_date":"2025-11-23","model_type":"image","page_url":"https://fal.run/fal-ai/flux-2/edit","tagline":"Image-to-image editing with FLUX.2 [dev] from Black Forest Labs.","capabilities":{"streaming":true,"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/flux-2/flash/edit","name":"FLUX 2 Flash Edit","created_by":"fal","source":"official","description":"Image-to-image editing with FLUX.2 [dev] from Black Forest 
Labs.","status":"active","release_date":"2025-12-16","model_type":"image","page_url":"https://fal.run/fal-ai/flux-2/flash/edit","tagline":"Image-to-image editing with FLUX.2 [dev] from Black Forest Labs.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/flux-2/flash","name":"FLUX 2 Flash","created_by":"fal","source":"official","description":"Text-to-image generation with FLUX.2 [dev] from Black Forest Labs.","status":"active","release_date":"2025-12-16","model_type":"image","page_url":"https://fal.run/fal-ai/flux-2/flash","tagline":"Text-to-image generation with FLUX.2 [dev] from Black Forest Labs.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/flux-2-flex/edit","name":"Flux 2 Flex","created_by":"fal","source":"official","description":"Image editing with FLUX.2 [flex] from Black Forest Labs.","status":"active","release_date":"2025-11-25","model_type":"image","page_url":"https://fal.run/fal-ai/flux-2-flex/edit","tagline":"Image editing with FLUX.2 [flex] from Black Forest Labs.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/flux-2-flex","name":"Flux 2 Flex","created_by":"fal","source":"official","description":"Text-to-image generation with FLUX.2 [flex] from Black Forest Labs.","status":"active","release_date":"2025-11-25","model_type":"image","page_url":"https://fal.run/fal-ai/flux-2-flex","tagline":"Text-to-image generation with FLUX.2 [flex] from Black Forest 
Labs.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/flux-2/klein/4b/base/edit/lora","name":"FLUX.2 [klein] 4B Base LoRA","created_by":"fal","source":"official","description":"Image-to-image editing with LoRA support for FLUX.2 [klein] 4B Base from Black Forest Labs.","status":"active","release_date":"2026-01-19","model_type":"image","page_url":"https://fal.run/fal-ai/flux-2/klein/4b/base/edit/lora","tagline":"Image-to-image editing with LoRA support for FLUX.2 [klein] 4B Base from Black Forest Labs.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-03-17","last_updated":"2026-05-11"},{"id":"fal-ai/flux-2/klein/4b/base/edit","name":"FLUX.2 [klein] 4B Base","created_by":"fal","source":"official","description":"Image-to-image editing with FLUX.2 [klein] 4B Base from Black Forest Labs.","status":"active","release_date":"2026-01-15","model_type":"image","page_url":"https://fal.run/fal-ai/flux-2/klein/4b/base/edit","tagline":"Image-to-image editing with FLUX.2 [klein] 4B Base from Black Forest Labs.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-03-17","last_updated":"2026-05-11"},{"id":"fal-ai/flux-2/klein/4b/base/lora","name":"FLUX.2 [klein] 4B Base LoRA","created_by":"fal","source":"official","description":"Text-to-image generation with LoRA support for FLUX.2 [klein] 4B Base from Black Forest Labs.","status":"active","release_date":"2026-01-19","model_type":"image","page_url":"https://fal.run/fal-ai/flux-2/klein/4b/base/lora","tagline":"Text-to-image generation with LoRA support for FLUX.2 [klein] 4B Base from Black Forest 
Labs.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-03-17","last_updated":"2026-05-11"},{"id":"fal-ai/flux-2-klein-4b-base-trainer/edit","name":"Flux 2 Klein 4B Base Trainer","created_by":"fal","source":"official","description":"Fine-tune FLUX.2 [klein] 4B from Black Forest Labs with custom datasets.","status":"active","release_date":"2026-01-16","model_type":"other","parameters":4,"page_url":"https://fal.run/fal-ai/flux-2-klein-4b-base-trainer/edit","tagline":"Fine-tune FLUX.2 [klein] 4B from Black Forest Labs with custom datasets.","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/flux-2-klein-4b-base-trainer","name":"Flux 2 Klein 4B Base Trainer","created_by":"fal","source":"official","description":"Fine-tune FLUX.2 [klein] 4B from Black Forest Labs with custom datasets.","status":"active","release_date":"2026-01-17","model_type":"other","parameters":4,"page_url":"https://fal.run/fal-ai/flux-2-klein-4b-base-trainer","tagline":"Fine-tune FLUX.2 [klein] 4B from Black Forest Labs with custom datasets.","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/flux-2/klein/4b/base","name":"FLUX.2 [klein] 4B Base","created_by":"fal","source":"official","description":"Text-to-image generation with FLUX.2 [klein] 4B Base from Black Forest Labs.","status":"active","release_date":"2026-01-15","model_type":"image","page_url":"https://fal.run/fal-ai/flux-2/klein/4b/base","tagline":"Text-to-image generation with FLUX.2 [klein] 4B Base from Black Forest Labs.","capabilities":{"streaming":true,"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-03-17","last_updated":"2026-05-11"},{"id":"fal-ai/flux-2/klein/4b/edit/lora","name":"FLUX.2 [klein] 4B LoRA","created_by":"fal","source":"official","description":"Image-to-image editing with FLUX.2 [klein] 4B from Black Forest Labs and custom 
LoRA.","status":"active","release_date":"2026-03-17","model_type":"image","page_url":"https://fal.run/fal-ai/flux-2/klein/4b/edit/lora","tagline":"Image-to-image editing with FLUX.2 [klein] 4B from Black Forest Labs and custom LoRA.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-03-17","last_updated":"2026-05-11"},{"id":"fal-ai/flux-2/klein/4b/edit","name":"FLUX.2 [klein] 4B","created_by":"fal","source":"official","description":"Image-to-image editing with FLUX.2 [klein] 4B from Black Forest Labs.","status":"active","release_date":"2026-01-15","model_type":"image","page_url":"https://fal.run/fal-ai/flux-2/klein/4b/edit","tagline":"Image-to-image editing with FLUX.2 [klein] 4B from Black Forest Labs.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-03-17","last_updated":"2026-05-11"},{"id":"fal-ai/flux-2/klein/4b/lora","name":"FLUX.2 [klein] 4B LoRA","created_by":"fal","source":"official","description":"Text-to-image generation with FLUX.2 [klein] 4B from Black Forest Labs and custom LoRA.","status":"active","release_date":"2026-03-17","model_type":"image","page_url":"https://fal.run/fal-ai/flux-2/klein/4b/lora","tagline":"Text-to-image generation with FLUX.2 [klein] 4B from Black Forest Labs and custom LoRA.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-03-17","last_updated":"2026-05-11"},{"id":"fal-ai/flux-2/klein/4b","name":"FLUX.2 [klein] 4B","created_by":"fal","source":"official","description":"Text-to-image generation with FLUX.2 [klein] 4B from Black Forest Labs.","status":"active","release_date":"2026-01-15","model_type":"image","page_url":"https://fal.run/fal-ai/flux-2/klein/4b","tagline":"Text-to-image generation with FLUX.2 [klein] 4B from Black Forest 
Labs.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-03-17","last_updated":"2026-05-11"},{"id":"fal-ai/flux-2/klein/9b/base/edit/lora","name":"FLUX.2 [klein] 9B Base LoRA","created_by":"fal","source":"official","description":"Image-to-image editing with LoRA support for FLUX.2 [klein] 9B Base from Black Forest Labs.","status":"active","release_date":"2026-01-19","model_type":"image","page_url":"https://fal.run/fal-ai/flux-2/klein/9b/base/edit/lora","tagline":"Image-to-image editing with LoRA support for FLUX.2 [klein] 9B Base from Black Forest Labs.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-03-17","last_updated":"2026-05-11"},{"id":"fal-ai/flux-2/klein/9b/base/edit","name":"FLUX.2 [klein] 9B Base","created_by":"fal","source":"official","description":"Image-to-image editing with Flux 2 [klein] 9B Base from Black Forest Labs.","status":"active","release_date":"2026-01-15","model_type":"image","page_url":"https://fal.run/fal-ai/flux-2/klein/9b/base/edit","tagline":"Image-to-image editing with Flux 2 [klein] 9B Base from Black Forest Labs.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-03-17","last_updated":"2026-05-11"},{"id":"fal-ai/flux-2/klein/9b/base/lora","name":"FLUX.2 [klein] 9B Base LoRA","created_by":"fal","source":"official","description":"Text-to-image generation with LoRA support for FLUX.2 [klein] 9B Base from Black Forest Labs.","status":"active","release_date":"2026-01-19","model_type":"image","page_url":"https://fal.run/fal-ai/flux-2/klein/9b/base/lora","tagline":"Text-to-image generation with LoRA support for FLUX.2 [klein] 9B Base from Black Forest 
Labs.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-03-17","last_updated":"2026-05-11"},{"id":"fal-ai/flux-2-klein-9b-base-trainer/edit","name":"Flux 2 Klein 9B Base Trainer","created_by":"fal","source":"official","description":"Fine-tune FLUX.2 [klein] 9B from Black Forest Labs with custom datasets.","status":"active","release_date":"2026-01-17","model_type":"other","parameters":9,"page_url":"https://fal.run/fal-ai/flux-2-klein-9b-base-trainer/edit","tagline":"Fine-tune FLUX.2 [klein] 9B from Black Forest Labs with custom datasets.","last_seen_at":"2026-06-19","last_updated":"2026-06-20"},{"id":"fal-ai/flux-2-klein-9b-base-trainer","name":"FLUX 2 [klein] 9b Base Trainer","created_by":"fal","source":"official","description":"Fine-tune FLUX.2 [klein] 9B from Black Forest Labs with custom datasets.","status":"active","release_date":"2026-01-17","model_type":"other","parameters":9,"page_url":"https://fal.run/fal-ai/flux-2-klein-9b-base-trainer","tagline":"Fine-tune FLUX.2 [klein] 9B from Black Forest Labs with custom datasets.","last_seen_at":"2026-06-19","last_updated":"2026-06-20"},{"id":"fal-ai/flux-2/klein/9b/base","name":"FLUX.2 [klein] 9B Base","created_by":"fal","source":"official","description":"Text-to-image generation with FLUX.2 [klein] 9B Base from Black Forest Labs.","status":"active","release_date":"2026-01-15","model_type":"image","page_url":"https://fal.run/fal-ai/flux-2/klein/9b/base","tagline":"Text-to-image generation with FLUX.2 [klein] 9B Base from Black Forest Labs.","capabilities":{"streaming":true,"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/flux-2/klein/9b/edit/lora","name":"FLUX.2 [klein] 9B LoRA","created_by":"fal","source":"official","description":"Image-to-image editing with FLUX.2 [klein] 9B from Black Forest Labs and custom 
LoRA.","status":"active","release_date":"2026-03-17","model_type":"image","page_url":"https://fal.run/fal-ai/flux-2/klein/9b/edit/lora","tagline":"Image-to-image editing with FLUX.2 [klein] 9B from Black Forest Labs and custom LoRA.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-03-20","last_updated":"2026-05-11"},{"id":"fal-ai/flux-2/klein/9b/edit","name":"FLUX.2 [klein] 9B","created_by":"fal","source":"official","description":"Image-to-image editing with FLUX.2 [klein] 9B from Black Forest Labs.","status":"active","release_date":"2026-01-15","model_type":"image","page_url":"https://fal.run/fal-ai/flux-2/klein/9b/edit","tagline":"Image-to-image editing with FLUX.2 [klein] 9B from Black Forest Labs.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-03-17","last_updated":"2026-05-11"},{"id":"fal-ai/flux-2/klein/9b/lora","name":"FLUX.2 [klein] 9B LoRA","created_by":"fal","source":"official","description":"Text-to-image generation with FLUX.2 [klein] 9B from Black Forest Labs and custom LoRA.","status":"active","release_date":"2026-03-17","model_type":"image","page_url":"https://fal.run/fal-ai/flux-2/klein/9b/lora","tagline":"Text-to-image generation with FLUX.2 [klein] 9B from Black Forest Labs and custom LoRA.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-03-20","last_updated":"2026-05-11"},{"id":"fal-ai/flux-2/klein/9b","name":"FLUX.2 [klein] 9B","created_by":"fal","source":"official","description":"Text-to-image generation with FLUX.2 [klein] 9B from Black Forest Labs.","status":"active","release_date":"2026-01-15","model_type":"image","page_url":"https://fal.run/fal-ai/flux-2/klein/9b","tagline":"Text-to-image generation with FLUX.2 [klein] 9B from Black Forest 
Labs.","capabilities":{"streaming":true,"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/flux-2/klein/realtime","name":"Flux 2 [klein] Realtime","created_by":"fal","source":"official","description":"Realtime generation with FLUX.2 [klein] from Black Forest Labs.","status":"active","release_date":"2026-02-05","model_type":"image","page_url":"https://fal.run/fal-ai/flux-2/klein/realtime","tagline":"Realtime generation with FLUX.2 [klein] from Black Forest Labs.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-02-09","last_updated":"2026-05-11"},{"id":"fal-ai/flux-2/lora/edit","name":"FLUX 2 Lora Edit","created_by":"fal","source":"official","description":"Image-to-image editing with LoRA support for FLUX.2 [dev] from Black Forest Labs.","status":"active","release_date":"2025-11-23","model_type":"image","page_url":"https://fal.run/fal-ai/flux-2/lora/edit","tagline":"Image-to-image editing with LoRA support for FLUX.2 [dev] from Black Forest Labs.","capabilities":{"streaming":true,"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/flux-2-lora-gallery/add-background","name":"Flux 2 Lora Gallery","created_by":"fal","source":"official","description":"Add a background to images with white/clean background","status":"active","release_date":"2025-11-25","model_type":"image","page_url":"https://fal.run/fal-ai/flux-2-lora-gallery/add-background","tagline":"Add a background to images with white/clean background","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/flux-2-lora-gallery/apartment-staging","name":"Flux 2 Lora 
Gallery","created_by":"fal","source":"official","description":"Virtually furnishes an empty apartment","status":"active","release_date":"2025-11-25","model_type":"image","page_url":"https://fal.run/fal-ai/flux-2-lora-gallery/apartment-staging","tagline":"Virtually furnishes an empty apartment","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/flux-2-lora-gallery/ballpoint-pen-sketch","name":"Flux 2 Lora Gallery","created_by":"fal","source":"official","description":"Ballpoint pen sketch drawing style","status":"active","release_date":"2025-11-25","model_type":"image","page_url":"https://fal.run/fal-ai/flux-2-lora-gallery/ballpoint-pen-sketch","tagline":"Ballpoint pen sketch drawing style","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/flux-2-lora-gallery/digital-comic-art","name":"Flux 2 Lora Gallery","created_by":"fal","source":"official","description":"Transforms images into comic book style","status":"active","release_date":"2025-11-25","model_type":"image","page_url":"https://fal.run/fal-ai/flux-2-lora-gallery/digital-comic-art","tagline":"Transforms images into comic book style","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/flux-2-lora-gallery/face-to-full-portrait","name":"Flux 2 Lora Gallery","created_by":"fal","source":"official","description":"Extends a face into a full body portrait","status":"active","release_date":"2025-11-25","model_type":"image","page_url":"https://fal.run/fal-ai/flux-2-lora-gallery/face-to-full-portrait","tagline":"Extends a face into a full body 
portrait","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/flux-2-lora-gallery/hdr-style","name":"FLUX 2 Lora Gallery Hdr Style","created_by":"fal","source":"official","description":"HDR surrealistic effect with intense colors","status":"active","release_date":"2025-11-25","model_type":"image","page_url":"https://fal.run/fal-ai/flux-2-lora-gallery/hdr-style","tagline":"HDR surrealistic effect with intense colors","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/flux-2-lora-gallery/multiple-angles","name":"Flux 2 Lora Gallery","created_by":"fal","source":"official","description":"Generates same object from different angles (azimuth/elevation)","status":"active","release_date":"2025-11-25","model_type":"image","page_url":"https://fal.run/fal-ai/flux-2-lora-gallery/multiple-angles","tagline":"Generates same object from different angles (azimuth/elevation)","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/flux-2-lora-gallery/realism","name":"FLUX 2 Lora Gallery Realism","created_by":"fal","source":"official","description":"Makes images more photorealistic and natural","status":"active","release_date":"2025-11-25","model_type":"image","page_url":"https://fal.run/fal-ai/flux-2-lora-gallery/realism","tagline":"Makes images more photorealistic and natural","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/flux-2-lora-gallery/satellite-view-style","name":"Flux 2 Lora Gallery","created_by":"fal","source":"official","description":"Generates satellite/aerial view 
style images","status":"active","release_date":"2025-11-25","model_type":"image","page_url":"https://fal.run/fal-ai/flux-2-lora-gallery/satellite-view-style","tagline":"Generates satellite/aerial view style images","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/flux-2-lora-gallery/sepia-vintage","name":"Flux 2 Lora Gallery","created_by":"fal","source":"official","description":"Applies sepia vintage effect to images","status":"active","release_date":"2025-11-25","model_type":"image","page_url":"https://fal.run/fal-ai/flux-2-lora-gallery/sepia-vintage","tagline":"Applies sepia vintage effect to images","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/flux-2-lora-gallery/virtual-tryon","name":"Flux 2 Lora Gallery","created_by":"fal","source":"official","description":"Virtual clothing try-on (2 images: person + garment)","status":"active","release_date":"2025-11-25","model_type":"image","page_url":"https://fal.run/fal-ai/flux-2-lora-gallery/virtual-tryon","tagline":"Virtual clothing try-on (2 images: person + garment)","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/flux-2/lora","name":"FLUX 2 Lora","created_by":"fal","source":"official","description":"Text-to-image generation with LoRA support for FLUX.2 [dev] from Black Forest Labs.","status":"active","release_date":"2025-11-23","model_type":"image","page_url":"https://fal.run/fal-ai/flux-2/lora","tagline":"Text-to-image generation with LoRA support for FLUX.2 [dev] from Black Forest 
Labs.","capabilities":{"streaming":true,"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/flux-2-max/edit","name":"Flux 2 Max","created_by":"fal","source":"official","description":"FLUX.2 [max] delivers state-of-the-art image generation and advanced image editing with exceptional realism, precision, and consistency.","status":"active","release_date":"2025-12-16","model_type":"image","page_url":"https://fal.run/fal-ai/flux-2-max/edit","tagline":"FLUX.2 [max] delivers state-of-the-art image generation and advanced image editing with exceptional realism, precision, and consistency.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-24","last_updated":"2026-05-11"},{"id":"fal-ai/flux-2-max","name":"Flux 2 Max","created_by":"fal","source":"official","description":"FLUX.2 [max] delivers state-of-the-art image generation and advanced image editing with exceptional realism, precision, and consistency.","status":"active","release_date":"2025-12-16","model_type":"image","page_url":"https://fal.run/fal-ai/flux-2-max","tagline":"FLUX.2 [max] delivers state-of-the-art image generation and advanced image editing with exceptional realism, precision, and consistency.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/flux-2-pro/edit","name":"FLUX 2 Pro Edit","created_by":"fal","source":"official","description":"Text-to-image generation with FLUX.2 [pro] from Black Forest Labs.","status":"active","release_date":"2025-11-23","model_type":"image","page_url":"https://fal.run/fal-ai/flux-2-pro/edit","tagline":"Text-to-image generation with FLUX.2 [pro] from Black Forest 
Labs.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/flux-2-pro/outpaint","name":"FLUX 2 Pro Outpaint","created_by":"fal","source":"official","description":"Outpainting generation with FLUX.2 [pro] from Black Forest Labs.","status":"active","release_date":"2026-05-14","model_type":"image","page_url":"https://fal.run/fal-ai/flux-2-pro/outpaint","tagline":"Outpainting generation with FLUX.2 [pro] from Black Forest Labs.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/flux-2-pro","name":"Flux 2 Pro","created_by":"fal","source":"official","description":"Image editing with FLUX.2 [pro] from Black Forest Labs.","status":"active","release_date":"2025-11-23","model_type":"image","page_url":"https://fal.run/fal-ai/flux-2-pro","tagline":"Image editing with FLUX.2 [pro] from Black Forest Labs.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/flux-2-trainer/edit","name":"FLUX 2 Trainer Edit","created_by":"fal","source":"official","description":"Fine-tune FLUX.2 [dev] from Black Forest Labs with custom datasets.","status":"active","release_date":"2025-11-25","model_type":"other","page_url":"https://fal.run/fal-ai/flux-2-trainer/edit","tagline":"Fine-tune FLUX.2 [dev] from Black Forest Labs with custom datasets.","last_seen_at":"2026-06-19","last_updated":"2026-06-20"},{"id":"fal-ai/flux-2-trainer-v2/edit","name":"FLUX 2 Trainer V2 Edit","created_by":"fal","source":"official","description":"Fine-tune FLUX.2 [dev] from Black Forest Labs with custom 
datasets.","status":"active","release_date":"2026-01-10","model_type":"other","page_url":"https://fal.run/fal-ai/flux-2-trainer-v2/edit","tagline":"Fine-tune FLUX.2 [dev] from Black Forest Labs with custom datasets.","last_seen_at":"2026-06-19","last_updated":"2026-06-20"},{"id":"fal-ai/flux-2-trainer-v2","name":"FLUX 2 Trainer V2","created_by":"fal","source":"official","description":"Fine-tune FLUX.2 [dev] from Black Forest Labs with custom datasets.","status":"active","release_date":"2026-01-10","model_type":"other","page_url":"https://fal.run/fal-ai/flux-2-trainer-v2","tagline":"Fine-tune FLUX.2 [dev] from Black Forest Labs with custom datasets.","last_seen_at":"2026-06-19","last_updated":"2026-06-20"},{"id":"fal-ai/flux-2-trainer","name":"FLUX 2 Trainer","created_by":"fal","source":"official","description":"Fine-tune FLUX.2 [dev] from Black Forest Labs with custom datasets.","status":"active","release_date":"2025-11-25","model_type":"other","page_url":"https://fal.run/fal-ai/flux-2-trainer","tagline":"Fine-tune FLUX.2 [dev] from Black Forest Labs with custom datasets.","last_seen_at":"2026-06-19","last_updated":"2026-06-20"},{"id":"fal-ai/flux-2/turbo/edit","name":"FLUX 2 Turbo Edit","created_by":"fal","source":"official","description":"Image-to-image editing with FLUX.2 [dev] from Black Forest Labs.","status":"active","release_date":"2025-12-16","model_type":"image","page_url":"https://fal.run/fal-ai/flux-2/turbo/edit","tagline":"Image-to-image editing with FLUX.2 [dev] from Black Forest Labs.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/flux-2/turbo","name":"FLUX 2 Turbo","created_by":"fal","source":"official","description":"Text-to-image generation with FLUX.2 [dev] from Black Forest 
Labs.","status":"active","release_date":"2025-12-16","model_type":"image","page_url":"https://fal.run/fal-ai/flux-2/turbo","tagline":"Text-to-image generation with FLUX.2 [dev] from Black Forest Labs.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/flux-2","name":"FLUX 2","created_by":"fal","source":"official","description":"Text-to-image generation with FLUX.2 [dev] from Black Forest Labs.","status":"active","release_date":"2025-11-23","model_type":"image","page_url":"https://fal.run/fal-ai/flux-2","tagline":"Text-to-image generation with FLUX.2 [dev] from Black Forest Labs.","capabilities":{"streaming":true,"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-05-27","last_updated":"2026-06-03"},{"id":"fal-ai/flux-control-lora-canny/image-to-image","name":"FLUX.1 [dev] Control LoRA Canny","created_by":"fal","source":"official","description":"FLUX Control LoRA Canny is a high-performance endpoint that uses a control image using a Canny edge map to transfer structure to the generated image and another initial image to guide color.","status":"active","release_date":"2025-02-11","model_type":"image","page_url":"https://fal.run/fal-ai/flux-control-lora-canny/image-to-image","tagline":"FLUX Control LoRA Canny is a high-performance endpoint that uses a control image using a Canny edge map to transfer structure to the generated image and another initial image to guide color.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/flux-control-lora-canny","name":"FLUX.1 [dev] Control LoRA Canny","created_by":"fal","source":"official","description":"FLUX Control LoRA Canny is a high-performance endpoint that uses a control image to transfer structure to the 
generated image, using a Canny edge map.","status":"active","release_date":"2025-02-11","model_type":"image","page_url":"https://fal.run/fal-ai/flux-control-lora-canny","tagline":"FLUX Control LoRA Canny is a high-performance endpoint that uses a control image to transfer structure to the generated image, using a Canny edge map.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/flux-control-lora-depth/image-to-image","name":"FLUX.1 [dev] Control LoRA Depth","created_by":"fal","source":"official","description":"FLUX Control LoRA Depth is a high-performance endpoint that uses a control image using a depth map to transfer structure to the generated image and another initial image to guide color.","status":"active","release_date":"2025-02-11","model_type":"image","page_url":"https://fal.run/fal-ai/flux-control-lora-depth/image-to-image","tagline":"FLUX Control LoRA Depth is a high-performance endpoint that uses a control image using a depth map to transfer structure to the generated image and another initial image to guide color.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/flux-control-lora-depth","name":"FLUX.1 [dev] Control LoRA Depth","created_by":"fal","source":"official","description":"FLUX Control LoRA Depth is a high-performance endpoint that uses a control image to transfer structure to the generated image, using a depth map.","status":"active","release_date":"2025-02-11","model_type":"image","page_url":"https://fal.run/fal-ai/flux-control-lora-depth","tagline":"FLUX Control LoRA Depth is a high-performance endpoint that uses a control image to transfer structure to the generated image, using a depth 
map.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/flux/dev/image-to-image","name":"FLUX.1 [dev]","created_by":"fal","source":"official","description":"FLUX.1 Image-to-Image is a high-performance endpoint for the FLUX.1 [dev] model that enables rapid transformation of existing images, delivering high-quality style transfers and image modifications wi","status":"active","release_date":"2024-07-11","model_type":"image","page_url":"https://fal.run/fal-ai/flux/dev/image-to-image","tagline":"FLUX.1 Image-to-Image is a high-performance endpoint for the FLUX.1 [dev] model that enables rapid transformation of existing images, delivering high-quality style transfers and image modifications wi","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/flux/dev/redux","name":"FLUX.1 [dev] Redux","created_by":"fal","source":"official","description":"FLUX.1 [dev] Redux is a high-performance endpoint for the FLUX.1 [dev] model that enables rapid transformation of existing images, delivering high-quality style transfers and image modifications with ","status":"active","release_date":"2024-11-21","model_type":"image","page_url":"https://fal.run/fal-ai/flux/dev/redux","tagline":"FLUX.1 [dev] Redux is a high-performance endpoint for the FLUX.1 [dev] model that enables rapid transformation of existing images, delivering high-quality style transfers and image modifications with ","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/flux/dev","name":"FLUX.1 [dev]","created_by":"fal","source":"official","description":"FLUX.1 [dev] is a 12 billion parameter flow transformer that generates high-quality 
images from text.","status":"active","release_date":"2025-04-01","model_type":"image","page_url":"https://fal.run/fal-ai/flux/dev","tagline":"FLUX.1 [dev] is a 12 billion parameter flow transformer that generates high-quality images from text.","capabilities":{"streaming":true,"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/flux-differential-diffusion","name":"FLUX.1 [dev] Differential Diffusion","created_by":"fal","source":"official","description":"FLUX.1 Differential Diffusion is a rapid endpoint that enables swift, granular control over image transformations through change maps, delivering fast and precise region-specific modifications while m","status":"active","release_date":"2024-11-06","model_type":"image","page_url":"https://fal.run/fal-ai/flux-differential-diffusion","tagline":"FLUX.1 Differential Diffusion is a rapid endpoint that enables swift, granular control over image transformations through change maps, delivering fast and precise region-specific modifications while m","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/flux-general/differential-diffusion","name":"FLUX.1 [dev] with Controlnets and Loras","created_by":"fal","source":"official","description":"A specialized FLUX endpoint combining differential diffusion control with LoRA, ControlNet, and IP-Adapter support, enabling precise, region-specific image transformations through customizable change ","status":"active","release_date":"2024-08-13","model_type":"image","page_url":"https://fal.run/fal-ai/flux-general/differential-diffusion","tagline":"A specialized FLUX endpoint combining differential diffusion control with LoRA, ControlNet, and IP-Adapter support, enabling precise, region-specific image transformations through customizable change 
","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/flux-general/image-to-image","name":"FLUX.1 [dev] with Controlnets and Loras","created_by":"fal","source":"official","description":"FLUX General Image-to-Image is a versatile endpoint that transforms existing images with support for LoRA, ControlNet, and IP-Adapter extensions, enabling precise control over style transfer, modifica","status":"active","release_date":"2024-08-14","model_type":"image","page_url":"https://fal.run/fal-ai/flux-general/image-to-image","tagline":"FLUX General Image-to-Image is a versatile endpoint that transforms existing images with support for LoRA, ControlNet, and IP-Adapter extensions, enabling precise control over style transfer, modifica","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/flux-general/inpainting","name":"FLUX.1 [dev] with Controlnets and Loras","created_by":"fal","source":"official","description":"FLUX General Inpainting is a versatile endpoint that enables precise image editing and completion, supporting multiple AI extensions including LoRA, ControlNet, and IP-Adapter for enhanced control ove","status":"active","release_date":"2024-08-14","model_type":"image","page_url":"https://fal.run/fal-ai/flux-general/inpainting","tagline":"FLUX General Inpainting is a versatile endpoint that enables precise image editing and completion, supporting multiple AI extensions including LoRA, ControlNet, and IP-Adapter for enhanced control ove","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/flux-general/rf-inversion","name":"FLUX.1 [dev] with Controlnets and 
Loras","created_by":"fal","source":"official","description":"A general purpose endpoint for the FLUX.1 [dev] model, implementing the RF-Inversion pipeline.","status":"active","release_date":"2024-09-17","model_type":"image","page_url":"https://fal.run/fal-ai/flux-general/rf-inversion","tagline":"A general purpose endpoint for the FLUX.1 [dev] model, implementing the RF-Inversion pipeline.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/flux-general","name":"FLUX.1 [dev] with Controlnets and Loras","created_by":"fal","source":"official","description":"A versatile endpoint for the FLUX.1 [dev] model that supports multiple AI extensions including LoRA, ControlNet conditioning, and IP-Adapter integration, enabling comprehensive control over image gene","status":"active","release_date":"2024-08-21","model_type":"image","page_url":"https://fal.run/fal-ai/flux-general","tagline":"A versatile endpoint for the FLUX.1 [dev] model that supports multiple AI extensions including LoRA, ControlNet conditioning, and IP-Adapter integration, enabling comprehensive control over image gene","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/flux-kontext/dev","name":"FLUX.1 Kontext [dev]","created_by":"fal","source":"official","description":"Frontier image editing model.","status":"active","release_date":"2025-05-28","model_type":"image","page_url":"https://fal.run/fal-ai/flux-kontext/dev","tagline":"Frontier image editing model.","capabilities":{"streaming":true,"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/flux-kontext-lora/inpaint","name":"Flux Kontext 
Lora","created_by":"fal","source":"official","description":"Fast inpainting endpoint for the FLUX.1 Kontext [dev] model with LoRA support, enabling rapid and high-quality image inpainting with reference images, while using pre-trained LoRA adaptations for spec","status":"active","release_date":"2025-07-29","model_type":"image","page_url":"https://fal.run/fal-ai/flux-kontext-lora/inpaint","tagline":"Fast inpainting endpoint for the FLUX.1 Kontext [dev] model with LoRA support, enabling rapid and high-quality image inpainting with reference images, while using pre-trained LoRA adaptations for spec","capabilities":{"streaming":true,"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/flux-kontext-lora/text-to-image","name":"Flux Kontext Lora","created_by":"fal","source":"official","description":"Super fast text-to-image endpoint for the FLUX.1 Kontext [dev] model with LoRA support, enabling rapid and high-quality image generation using pre-trained LoRA adaptations for personalization, specifi","status":"active","release_date":"2025-06-25","model_type":"image","page_url":"https://fal.run/fal-ai/flux-kontext-lora/text-to-image","tagline":"Super fast text-to-image endpoint for the FLUX.1 Kontext [dev] model with LoRA support, enabling rapid and high-quality image generation using pre-trained LoRA adaptations for personalization, specifi","capabilities":{"streaming":true,"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/flux-kontext-lora","name":"Flux Kontext Lora","created_by":"fal","source":"official","description":"Fast endpoint for the FLUX.1 Kontext [dev] model with LoRA support, enabling rapid and high-quality image editing using pre-trained LoRA adaptations for specific styles, brand identities, and 
product-","status":"active","release_date":"2025-06-25","model_type":"image","page_url":"https://fal.run/fal-ai/flux-kontext-lora","tagline":"Fast endpoint for the FLUX.1 Kontext [dev] model with LoRA support, enabling rapid and high-quality image editing using pre-trained LoRA adaptations for specific styles, brand identities, and product-","capabilities":{"streaming":true,"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/flux-kontext-trainer","name":"Flux Kontext Trainer","created_by":"fal","source":"official","description":"LoRA trainer for FLUX.1 Kontext [dev]","status":"active","release_date":"2025-06-26","model_type":"other","page_url":"https://fal.run/fal-ai/flux-kontext-trainer","tagline":"LoRA trainer for FLUX.1 Kontext [dev]","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/flux/krea/image-to-image","name":"FLUX.1 Krea [dev]","created_by":"fal","source":"official","description":"FLUX.1 Krea [dev] is a 12 billion parameter flow transformer that generates high-quality images from text with incredible aesthetics.","status":"active","release_date":"2025-07-30","model_type":"image","page_url":"https://fal.run/fal-ai/flux/krea/image-to-image","tagline":"FLUX.1 Krea [dev] is a 12 billion parameter flow transformer that generates high-quality images from text with incredible aesthetics.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/flux-krea-lora/image-to-image","name":"FLUX.1 Krea [dev] with LoRAs","created_by":"fal","source":"official","description":"FLUX LoRA Image-to-Image is a high-performance endpoint that transforms existing images using FLUX models, leveraging LoRA adaptations to enable rapid and precise image style transfer, modifications, 
","status":"active","release_date":"2025-08-01","model_type":"image","page_url":"https://fal.run/fal-ai/flux-krea-lora/image-to-image","tagline":"FLUX LoRA Image-to-Image is a high-performance endpoint that transforms existing images using FLUX models, leveraging LoRA adaptations to enable rapid and precise image style transfer, modifications, ","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/flux-krea-lora/inpainting","name":"FLUX.1 Krea [dev] Inpainting with LoRAs","created_by":"fal","source":"official","description":"Super fast endpoint for the FLUX.1 [dev] inpainting model with LoRA support, enabling rapid and high-quality image inpaingting using pre-trained LoRA adaptations for personalization, specific styles, ","status":"active","release_date":"2025-08-01","model_type":"image","page_url":"https://fal.run/fal-ai/flux-krea-lora/inpainting","tagline":"Super fast endpoint for the FLUX.1 [dev] inpainting model with LoRA support, enabling rapid and high-quality image inpaingting using pre-trained LoRA adaptations for personalization, specific styles, ","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/flux-krea-lora/stream","name":"Flux Krea Lora","created_by":"fal","source":"official","description":"Super fast endpoint for the FLUX.1 [dev] model with LoRA support, enabling rapid and high-quality image generation using pre-trained LoRA adaptations for personalization, specific styles, brand identi","status":"active","release_date":"2025-08-01","model_type":"image","page_url":"https://fal.run/fal-ai/flux-krea-lora/stream","tagline":"Super fast endpoint for the FLUX.1 [dev] model with LoRA support, enabling rapid and high-quality image generation using pre-trained LoRA adaptations for personalization, 
specific styles, brand identi","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/flux-krea-lora","name":"FLUX.1 Krea [dev] with LoRAs","created_by":"fal","source":"official","description":"Super fast endpoint for the FLUX.1 [dev] model with LoRA support, enabling rapid and high-quality image generation using pre-trained LoRA adaptations for personalization, specific styles, brand identi","status":"active","release_date":"2025-08-01","model_type":"image","page_url":"https://fal.run/fal-ai/flux-krea-lora","tagline":"Super fast endpoint for the FLUX.1 [dev] model with LoRA support, enabling rapid and high-quality image generation using pre-trained LoRA adaptations for personalization, specific styles, brand identi","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/flux/krea/redux","name":"FLUX.1 Krea [dev] Redux","created_by":"fal","source":"official","description":"FLUX.1 Krea [dev] Redux is a high-performance endpoint for the FLUX.1 Krea [dev] model that enables rapid transformation of existing images, delivering high-quality style transfers and image modificat","status":"active","release_date":"2025-07-30","model_type":"image","page_url":"https://fal.run/fal-ai/flux/krea/redux","tagline":"FLUX.1 Krea [dev] Redux is a high-performance endpoint for the FLUX.1 Krea [dev] model that enables rapid transformation of existing images, delivering high-quality style transfers and image modificat","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/flux-krea-trainer","name":"Train Flux Krea LoRA","created_by":"fal","source":"official","description":"Train styles, people and other subjects at blazing 
speeds using the FLUX.1 Krea [dev] base model.","status":"active","release_date":"2025-08-01","model_type":"other","page_url":"https://fal.run/fal-ai/flux-krea-trainer","tagline":"Train styles, people and other subjects at blazing speeds using the FLUX.1 Krea [dev] base model.","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/flux/krea","name":"FLUX.1 Krea [dev]","created_by":"fal","source":"official","description":"FLUX.1 Krea [dev] is a 12 billion parameter flow transformer that generates high-quality images from text with incredible aesthetics.","status":"active","release_date":"2025-07-30","model_type":"image","page_url":"https://fal.run/fal-ai/flux/krea","tagline":"FLUX.1 Krea [dev] is a 12 billion parameter flow transformer that generates high-quality images from text with incredible aesthetics.","capabilities":{"streaming":true,"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/flux-lora-canny","name":"FLUX.1 [dev] Canny with LoRAs","created_by":"fal","source":"official","description":"Utilize Flux.1 [dev] Controlnet to generate high-quality images with precise control over composition, style, and structure through advanced edge detection and guidance mechanisms.","status":"active","release_date":"2025-01-16","model_type":"image","page_url":"https://fal.run/fal-ai/flux-lora-canny","tagline":"Utilize Flux.1 [dev] Controlnet to generate high-quality images with precise control over composition, style, and structure through advanced edge detection and guidance mechanisms.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/flux-lora-depth","name":"FLUX.1 [dev] Depth with LoRAs","created_by":"fal","source":"official","description":"Generate high-quality images from depth maps using Flux.1 [dev] depth 
estimation model.","status":"active","release_date":"2024-11-21","model_type":"image","page_url":"https://fal.run/fal-ai/flux-lora-depth","tagline":"Generate high-quality images from depth maps using Flux.1 [dev] depth estimation model.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/flux-lora-fast-training","name":"Train Flux LoRA","created_by":"fal","source":"official","description":"Train styles, people and other subjects at blazing speeds.","status":"active","release_date":"2025-01-01","model_type":"other","page_url":"https://fal.run/fal-ai/flux-lora-fast-training","tagline":"Train styles, people and other subjects at blazing speeds.","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/flux-lora-fill","name":"FLUX.1 [dev] Fill with LoRAs","created_by":"fal","source":"official","description":"FLUX.1 [dev] Fill is a high-performance endpoint for the FLUX.1 [pro] model that enables rapid transformation of existing images, delivering high-quality style transfers and image modifications with t","status":"active","release_date":"2024-12-19","model_type":"image","page_url":"https://fal.run/fal-ai/flux-lora-fill","tagline":"FLUX.1 [dev] Fill is a high-performance endpoint for the FLUX.1 [pro] model that enables rapid transformation of existing images, delivering high-quality style transfers and image modifications with t","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/flux-lora/image-to-image","name":"FLUX.1 [dev] with LoRAs","created_by":"fal","source":"official","description":"FLUX LoRA Image-to-Image is a high-performance endpoint that transforms existing images using FLUX models, leveraging LoRA adaptations to enable rapid and precise image style transfer, modifications, 
","status":"active","release_date":"2024-08-13","model_type":"image","page_url":"https://fal.run/fal-ai/flux-lora/image-to-image","tagline":"FLUX LoRA Image-to-Image is a high-performance endpoint that transforms existing images using FLUX models, leveraging LoRA adaptations to enable rapid and precise image style transfer, modifications, ","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/flux-lora/inpainting","name":"FLUX.1 [dev] Inpainting with LoRAs","created_by":"fal","source":"official","description":"Super fast endpoint for the FLUX.1 [dev] inpainting model with LoRA support, enabling rapid and high-quality image inpaingting using pre-trained LoRA adaptations for personalization, specific styles, ","status":"active","release_date":"2024-09-18","model_type":"image","page_url":"https://fal.run/fal-ai/flux-lora/inpainting","tagline":"Super fast endpoint for the FLUX.1 [dev] inpainting model with LoRA support, enabling rapid and high-quality image inpaingting using pre-trained LoRA adaptations for personalization, specific styles, ","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/flux-lora-portrait-trainer","name":"Train Flux LoRAs For Portraits","created_by":"fal","source":"official","description":"FLUX LoRA training optimized for portrait generation, with bright highlights, excellent prompt following and highly detailed results.","status":"active","release_date":"2024-11-07","model_type":"other","page_url":"https://fal.run/fal-ai/flux-lora-portrait-trainer","tagline":"FLUX LoRA training optimized for portrait generation, with bright highlights, excellent prompt following and highly detailed results.","last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/flux-lora/stream","name":"Flux 
Lora","created_by":"fal","source":"official","description":"Super fast endpoint for the FLUX.1 [dev] model with LoRA support, enabling rapid and high-quality image generation using pre-trained LoRA adaptations for personalization, specific styles, brand identi","status":"active","release_date":"2025-05-15","model_type":"image","page_url":"https://fal.run/fal-ai/flux-lora/stream","tagline":"Super fast endpoint for the FLUX.1 [dev] model with LoRA support, enabling rapid and high-quality image generation using pre-trained LoRA adaptations for personalization, specific styles, brand identi","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/flux-lora","name":"FLUX.1 [dev] with LoRAs","created_by":"fal","source":"official","description":"Super fast endpoint for the FLUX.1 [dev] model with LoRA support, enabling rapid and high-quality image generation using pre-trained LoRA adaptations for personalization, specific styles, brand identi","status":"active","release_date":"2024-08-01","model_type":"image","page_url":"https://fal.run/fal-ai/flux-lora","tagline":"Super fast endpoint for the FLUX.1 [dev] model with LoRA support, enabling rapid and high-quality image generation using pre-trained LoRA adaptations for personalization, specific styles, brand identi","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/flux-pro/kontext/max/multi","name":"FLUX.1 Kontext [max]","created_by":"fal","source":"official","description":"Experimental version of FLUX.1 Kontext [max] with multi image handling capabilities","status":"active","release_date":"2025-05-29","model_type":"image","page_url":"https://fal.run/fal-ai/flux-pro/kontext/max/multi","tagline":"Experimental version of FLUX.1 Kontext [max] with multi image handling 
capabilities","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/flux-pro/kontext/max/text-to-image","name":"FLUX.1 Kontext [max]","created_by":"fal","source":"official","description":"FLUX.1 Kontext [max] text-to-image is a new premium model brings maximum performance across all aspects – greatly improved prompt adherence.","status":"active","release_date":"2025-05-29","model_type":"image","page_url":"https://fal.run/fal-ai/flux-pro/kontext/max/text-to-image","tagline":"FLUX.1 Kontext [max] text-to-image is a new premium model brings maximum performance across all aspects – greatly improved prompt adherence.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/flux-pro/kontext/max","name":"FLUX.1 Kontext [max]","created_by":"fal","source":"official","description":"FLUX.1 Kontext [max] is a model with greatly improved prompt adherence and typography generation meet premium consistency for editing without compromise on speed.","status":"active","release_date":"2025-05-29","model_type":"image","page_url":"https://fal.run/fal-ai/flux-pro/kontext/max","tagline":"FLUX.1 Kontext [max] is a model with greatly improved prompt adherence and typography generation meet premium consistency for editing without compromise on speed.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/flux-pro/kontext/multi","name":"FLUX.1 Kontext [pro]","created_by":"fal","source":"official","description":"Experimental version of FLUX.1 Kontext [pro] with multi image handling 
capabilities","status":"active","release_date":"2025-05-29","model_type":"image","page_url":"https://fal.run/fal-ai/flux-pro/kontext/multi","tagline":"Experimental version of FLUX.1 Kontext [pro] with multi image handling capabilities","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/flux-pro/kontext/text-to-image","name":"FLUX.1 Kontext [pro]","created_by":"fal","source":"official","description":"The FLUX.1 Kontext [pro] text-to-image delivers state-of-the-art image generation results with unprecedented prompt following, photorealistic rendering, and flawless typography.","status":"active","release_date":"2025-05-28","model_type":"image","page_url":"https://fal.run/fal-ai/flux-pro/kontext/text-to-image","tagline":"The FLUX.1 Kontext [pro] text-to-image delivers state-of-the-art image generation results with unprecedented prompt following, photorealistic rendering, and flawless typography.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/flux-pro/kontext","name":"FLUX.1 Kontext [pro]","created_by":"fal","source":"official","description":"FLUX.1 Kontext [pro] handles both text and reference images as inputs, seamlessly enabling targeted, local edits and complex transformations of entire scenes.","status":"active","release_date":"2025-05-28","model_type":"image","page_url":"https://fal.run/fal-ai/flux-pro/kontext","tagline":"FLUX.1 Kontext [pro] handles both text and reference images as inputs, seamlessly enabling targeted, local edits and complex transformations of entire scenes.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/flux-pro/v1/erase","name":"Flux Pro 
Erase","created_by":"fal","source":"official","description":"Latest object erasing model from Black Forest Labs.","status":"active","release_date":"2026-05-21","model_type":"image","page_url":"https://fal.run/fal-ai/flux-pro/v1/erase","tagline":"Latest object erasing model from Black forest labs.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-18","last_updated":"2026-06-20"},{"id":"fal-ai/flux-pro/v1/fill-finetuned","name":"FLUX.1 [pro] Fill Fine-tuned","created_by":"fal","source":"official","description":"FLUX.1 [pro] Fill Fine-tuned is a high-performance endpoint for the FLUX.1 [pro] model with a fine-tuned LoRA that enables rapid transformation of existing images, delivering high-quality style transf","status":"active","release_date":"2025-01-16","model_type":"image","page_url":"https://fal.run/fal-ai/flux-pro/v1/fill-finetuned","tagline":"FLUX.1 [pro] Fill Fine-tuned is a high-performance endpoint for the FLUX.1 [pro] model with a fine-tuned LoRA that enables rapid transformation of existing images, delivering high-quality style transf","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/flux-pro/v1/fill","name":"FLUX.1 [pro] Fill","created_by":"fal","source":"official","description":"FLUX.1 [pro] Fill is a high-performance endpoint for the FLUX.1 [pro] model that enables rapid transformation of existing images, delivering high-quality style transfers and image modifications with t","status":"active","release_date":"2024-11-21","model_type":"image","page_url":"https://fal.run/fal-ai/flux-pro/v1/fill","tagline":"FLUX.1 [pro] Fill is a high-performance endpoint for the FLUX.1 [pro] model that enables rapid transformation of existing images, delivering high-quality style transfers and image modifications with 
t","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/flux-pro/v1/vto","name":"FLUX Virtual Try-On ","created_by":"fal","source":"official","description":"Generate virtual try-on results from a person image plus one or more garment references.","status":"active","release_date":"2026-05-27","model_type":"image","page_url":"https://fal.run/fal-ai/flux-pro/v1/vto","tagline":"Generate virtual try-on results from a person image plus one or more garment references.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/flux-pro/v1.1/redux","name":"FLUX1.1 [pro] Redux","created_by":"fal","source":"official","description":"FLUX1.1 [pro] Redux is a high-performance endpoint for the FLUX1.1 [pro] model that enables rapid transformation of existing images, delivering high-quality style transfers and image modifications wit","status":"active","release_date":"2024-11-21","model_type":"image","page_url":"https://fal.run/fal-ai/flux-pro/v1.1/redux","tagline":"FLUX1.1 [pro] Redux is a high-performance endpoint for the FLUX1.1 [pro] model that enables rapid transformation of existing images, delivering high-quality style transfers and image modifications wit","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/flux-pro/v1.1-ultra-finetuned","name":"FLUX1.1 [pro] ultra Fine-tuned","created_by":"fal","source":"official","description":"FLUX1.1 [pro] ultra fine-tuned is the newest version of FLUX1.1 [pro] with a fine-tuned LoRA, maintaining professional-grade image quality while delivering up to 2K resolution with improved photo 
real","status":"active","release_date":"2025-01-16","model_type":"image","page_url":"https://fal.run/fal-ai/flux-pro/v1.1-ultra-finetuned","tagline":"FLUX1.1 [pro] ultra fine-tuned is the newest version of FLUX1.1 [pro] with a fine-tuned LoRA, maintaining professional-grade image quality while delivering up to 2K resolution with improved photo real","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/flux-pro/v1.1-ultra/redux","name":"FLUX1.1 [pro] ultra Redux","created_by":"fal","source":"official","description":"FLUX1.1 [pro] ultra Redux is a high-performance endpoint for the FLUX1.1 [pro] model that enables rapid transformation of existing images, delivering high-quality style transfers and image modificatio","status":"active","release_date":"2024-11-21","model_type":"image","page_url":"https://fal.run/fal-ai/flux-pro/v1.1-ultra/redux","tagline":"FLUX1.1 [pro] ultra Redux is a high-performance endpoint for the FLUX1.1 [pro] model that enables rapid transformation of existing images, delivering high-quality style transfers and image modificatio","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/flux-pro/v1.1-ultra","name":"FLUX1.1 [pro] ultra","created_by":"fal","source":"official","description":"FLUX1.1 [pro] ultra is the newest version of FLUX1.1 [pro], maintaining professional-grade image quality while delivering up to 2K resolution with improved photo realism.","status":"active","release_date":"2024-12-17","model_type":"image","page_url":"https://fal.run/fal-ai/flux-pro/v1.1-ultra","tagline":"FLUX1.1 [pro] ultra is the newest version of FLUX1.1 [pro], maintaining professional-grade image quality while delivering up to 2K resolution with improved photo 
realism.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/flux-pro/v1.1","name":"FLUX1.1 [pro]","created_by":"fal","source":"official","description":"FLUX1.1 [pro] is an enhanced version of FLUX.1 [pro], improved image generation capabilities, delivering superior composition, detail, and artistic fidelity compared to its predecessor.","status":"active","release_date":"2025-01-16","model_type":"image","page_url":"https://fal.run/fal-ai/flux-pro/v1.1","tagline":"FLUX1.1 [pro] is an enhanced version of FLUX.1 [pro], improved image generation capabilities, delivering superior composition, detail, and artistic fidelity compared to its predecessor.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/flux-pulid","name":"PuLID Flux","created_by":"fal","source":"official","description":"An endpoint for personalized image generation using Flux as per given description.","status":"active","release_date":"2024-10-29","model_type":"image","page_url":"https://fal.run/fal-ai/flux-pulid","tagline":"An endpoint for personalized image generation using Flux as per given description.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-03-10","last_updated":"2026-05-11"},{"id":"fal-ai/flux/schnell/redux","name":"FLUX.1 [schnell] Redux","created_by":"fal","source":"official","description":"FLUX.1 [schnell] Redux is a high-performance endpoint for the FLUX.1 [schnell] model that enables rapid transformation of existing images, delivering high-quality style transfers and image modificatio","status":"active","release_date":"2024-11-27","model_type":"image","page_url":"https://fal.run/fal-ai/flux/schnell/redux","tagline":"FLUX.1 [schnell] Redux is a 
high-performance endpoint for the FLUX.1 [schnell] model that enables rapid transformation of existing images, delivering high-quality style transfers and image modificatio","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/flux/schnell","name":"FLUX.1 [schnell]","created_by":"fal","source":"official","description":"FLUX.1 [schnell] is a 12 billion parameter flow transformer that generates high-quality images from text in 1 to 4 steps, suitable for personal and commercial use.","status":"active","release_date":"2024-11-25","model_type":"image","page_url":"https://fal.run/fal-ai/flux/schnell","tagline":"FLUX.1 [schnell] is a 12 billion parameter flow transformer that generates high-quality images from text in 1 to 4 steps, suitable for personal and commercial use.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/flux/srpo/image-to-image","name":"FLUX.1 SRPO [dev]","created_by":"fal","source":"official","description":"FLUX.1 SRPO [dev] is a 12 billion parameter flow transformer that generates high-quality images from text with incredible aesthetics.","status":"active","release_date":"2025-09-15","model_type":"image","page_url":"https://fal.run/fal-ai/flux/srpo/image-to-image","tagline":"FLUX.1 SRPO [dev] is a 12 billion parameter flow transformer that generates high-quality images from text with incredible aesthetics.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/flux/srpo","name":"FLUX.1 SRPO [dev]","created_by":"fal","source":"official","description":"FLUX.1 SRPO [dev] is a 12 billion parameter flow transformer that generates high-quality images from text with incredible 
aesthetics.","status":"active","release_date":"2025-09-15","model_type":"image","page_url":"https://fal.run/fal-ai/flux/srpo","tagline":"FLUX.1 SRPO [dev] is a 12 billion parameter flow transformer that generates high-quality images from text with incredible aesthetics.","capabilities":{"streaming":true,"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/flux-subject","name":"FLUX.1 Subject","created_by":"fal","source":"official","description":"Super fast endpoint for the FLUX.1 [schnell] model with subject input capabilities, enabling rapid and high-quality image generation for personalization, specific styles, brand identities, and product","status":"active","release_date":"2024-08-01","model_type":"image","page_url":"https://fal.run/fal-ai/flux-subject","tagline":"Super fast endpoint for the FLUX.1 [schnell] model with subject input capabilities, enabling rapid and high-quality image generation for personalization, specific styles, brand identities, and product","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/flux-vision-upscaler","name":"Flux Vision Upscaler","created_by":"fal","source":"official","description":"Flux Vision Upscaler for magnify/upscaling images with high fidelity and creativity.","status":"active","release_date":"2025-11-02","model_type":"image","page_url":"https://fal.run/fal-ai/flux-vision-upscaler","tagline":"Flux Vision Upscaler for magnify/upscaling images with high fidelity and creativity.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/fooocus/image-prompt","name":"Fooocus Image Prompt","created_by":"fal","source":"official","description":"Default parameters with 
automated optimizations and quality improvements.","status":"active","release_date":"2024-02-13","model_type":"image","page_url":"https://fal.run/fal-ai/fooocus/image-prompt","tagline":"Default parameters with automated optimizations and quality improvements.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/fooocus/inpaint","name":"Fooocus Inpainting","created_by":"fal","source":"official","description":"Default parameters with automated optimizations and quality improvements.","status":"active","release_date":"2024-02-13","model_type":"image","page_url":"https://fal.run/fal-ai/fooocus/inpaint","tagline":"Default parameters with automated optimizations and quality improvements.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/fooocus/upscale-or-vary","name":"Fooocus Upscale or Vary","created_by":"fal","source":"official","description":"Default parameters with automated optimizations and quality improvements.","status":"active","release_date":"2024-08-12","model_type":"image","page_url":"https://fal.run/fal-ai/fooocus/upscale-or-vary","tagline":"Default parameters with automated optimizations and quality improvements.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/fooocus","name":"Fooocus","created_by":"fal","source":"official","description":"Default parameters with automated optimizations and quality improvements.","status":"active","release_date":"2023-11-16","model_type":"image","page_url":"https://fal.run/fal-ai/fooocus","tagline":"Default parameters with automated optimizations and quality 
improvements.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/framepack/f1","name":"Framepack F1","created_by":"fal","source":"official","description":"Framepack is an efficient Image-to-video model that autoregressively generates videos.","status":"active","release_date":"2025-05-13","model_type":"video","page_url":"https://fal.run/fal-ai/framepack/f1","tagline":"Framepack is an efficient Image-to-video model that autoregressively generates videos.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/framepack/flf2v","name":"Framepack","created_by":"fal","source":"official","description":"Framepack is an efficient Image-to-video model that autoregressively generates videos.","status":"active","release_date":"2025-04-22","model_type":"video","page_url":"https://fal.run/fal-ai/framepack/flf2v","tagline":"Framepack is an efficient Image-to-video model that autoregressively generates videos.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/framepack","name":"Framepack","created_by":"fal","source":"official","description":"Framepack is an efficient Image-to-video model that autoregressively generates videos.","status":"active","release_date":"2025-04-17","model_type":"video","page_url":"https://fal.run/fal-ai/framepack","tagline":"Framepack is an efficient Image-to-video model that autoregressively generates videos.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/gemini-25-flash-image/edit","name":"Gemini 2.5 Flash 
Image","created_by":"fal","source":"official","family":"gemini-25","description":"Google's famous original image generation and editing model, a.k.a Nano Banana","status":"active","release_date":"2025-08-26","model_type":"image","page_url":"https://fal.run/fal-ai/gemini-25-flash-image/edit","tagline":"Google's famous original image generation and editing model, a.k.a Nano Banana","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/gemini-25-flash-image","name":"Gemini 2.5 Flash Image","created_by":"fal","source":"official","family":"gemini-25","description":"Google's famous original image generation and editing model, a.k.a Nano Banana","status":"active","release_date":"2025-08-26","model_type":"image","page_url":"https://fal.run/fal-ai/gemini-25-flash-image","tagline":"Google's famous original image generation and editing model, a.k.a Nano Banana","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/gemini-3-pro-image-preview/edit","name":"Gemini 3 Pro Image Preview","created_by":"fal","source":"official","family":"gemini-3","description":"Gemini 3 Pro Image (a.k.a Nano Banana Pro) is Google's state-of-the-art high-fidelity image generation and editing model","status":"active","release_date":"2025-11-20","model_type":"image","page_url":"https://fal.run/fal-ai/gemini-3-pro-image-preview/edit","tagline":"Gemini 3 Pro Image (a.k.a Nano Banana Pro) is Google's state-of-the-art high-fidelity image generation and editing model","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-28","last_updated":"2026-05-11"},{"id":"fal-ai/gemini-3-pro-image-preview","name":"Gemini 3 Pro Image 
Preview","created_by":"fal","source":"official","family":"gemini-3","description":"Gemini 3 Pro Image (a.k.a Nano Banana Pro) is Google's state-of-the-art high-fidelity image generation and editing model","status":"active","release_date":"2025-11-20","model_type":"image","page_url":"https://fal.run/fal-ai/gemini-3-pro-image-preview","tagline":"Gemini 3 Pro Image (a.k.a Nano Banana Pro) is Google's state-of-the-art high-fidelity image generation and editing model","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-28","last_updated":"2026-05-11"},{"id":"fal-ai/gemini-3.1-flash-image-preview/edit","name":"Gemini 3.1 Flash Image Preview","created_by":"fal","source":"official","family":"gemini-3.1","description":"Gemini 3.1 Flash Image (a.k.a.","status":"active","release_date":"2026-02-26","model_type":"image","page_url":"https://fal.run/fal-ai/gemini-3.1-flash-image-preview/edit","tagline":"Gemini 3.1 Flash Image (a.k.a.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-28","last_updated":"2026-05-11"},{"id":"fal-ai/gemini-3.1-flash-image-preview","name":"Gemini 3.1 Flash Image Preview","created_by":"fal","source":"official","family":"gemini-3.1","description":"Gemini 3.1 Flash Image (a.k.a Nano Banana 2) is Google's new state-of-the-art fast image generation and editing model","status":"active","release_date":"2026-02-26","model_type":"image","page_url":"https://fal.run/fal-ai/gemini-3.1-flash-image-preview","tagline":"Gemini 3.1 Flash Image (a.k.a Nano Banana 2) is Google's new state-of-the-art fast image generation and editing model","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-05-07","last_updated":"2026-05-11"},{"id":"fal-ai/gemini-3.1-flash-tts","name":"Gemini 3.1 Flash 
Tts","created_by":"fal","source":"official","family":"gemini-3.1","description":"Newest audio model from Google introduces granular audio tags that give you precise control to direct AI speech for expressive audio generation.","status":"active","release_date":"2026-04-16","model_type":"tts","page_url":"https://fal.run/fal-ai/gemini-3.1-flash-tts","tagline":"Newest audio model from Google introduces granular audio tags that give you precise control to direct AI speech for expressive audio generation.","modalities":{"input":["text"],"output":["audio"]},"endpoints":["audio_speech"],"last_seen_at":"2026-04-28","last_updated":"2026-05-11"},{"id":"fal-ai/gemini-tts","name":"Gemini TTS","created_by":"fal","source":"official","description":"Use Gemini TTS Models to convert your prompts to real audio.","status":"active","release_date":"2026-03-20","model_type":"other","page_url":"https://fal.run/fal-ai/gemini-tts","tagline":"Use Gemini TTS Models to convert your prompts to real audio.","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/genfocus/all-in-focus","name":"Genfocus","created_by":"fal","source":"official","description":"GenFocus Model to Refocus Images","status":"active","release_date":"2026-02-14","model_type":"image","page_url":"https://fal.run/fal-ai/genfocus/all-in-focus","tagline":"GenFocus Model to Refocus Images","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-02-14","last_updated":"2026-05-11"},{"id":"fal-ai/genfocus","name":"Genfocus","created_by":"fal","source":"official","description":"GenFocus Model to Refocus Images","status":"active","release_date":"2026-02-14","model_type":"image","page_url":"https://fal.run/fal-ai/genfocus","tagline":"GenFocus Model to Refocus 
Images","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-02-14","last_updated":"2026-05-11"},{"id":"fal-ai/ghiblify","name":"Ghiblify Images","created_by":"fal","source":"official","description":"Reimagine and transform your ordinary photos into enchanting Studio Ghibli style artwork","status":"active","release_date":"2025-03-31","model_type":"image","page_url":"https://fal.run/fal-ai/ghiblify","tagline":"Reimagine and transform your ordinary photos into enchanting Studio Ghibli style artwork","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/glm-image/image-to-image","name":"Glm Image","created_by":"fal","source":"official","family":"glm","description":"Create high-quality images with accurate text rendering and rich knowledge details—supports editing, style transfer, and maintaining consistent characters across multiple images.","status":"active","release_date":"2026-01-14","model_type":"image","page_url":"https://fal.run/fal-ai/glm-image/image-to-image","tagline":"Create high-quality images with accurate text rendering and rich knowledge details—supports editing, style transfer, and maintaining consistent characters across multiple images.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/glm-image","name":"Glm Image","created_by":"fal","source":"official","family":"glm","description":"Create high-quality images with accurate text rendering and rich knowledge details—supports editing, style transfer, and maintaining consistent characters across multiple images.","status":"active","release_date":"2026-01-14","model_type":"image","page_url":"https://fal.run/fal-ai/glm-image","tagline":"Create high-quality images with 
accurate text rendering and rich knowledge details—supports editing, style transfer, and maintaining consistent characters across multiple images.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/goal-force","name":"Goal Force","created_by":"fal","source":"official","description":"Physics-based video generation with Goal Force.","status":"active","release_date":"2026-03-17","model_type":"video","page_url":"https://fal.run/fal-ai/goal-force","tagline":"Physics-based video generation with Goal Force.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-03-17","last_updated":"2026-05-11"},{"id":"fal-ai/got-ocr/v2","name":"GOT OCR 2.0","created_by":"fal","source":"official","description":"GOT-OCR2 works on a wide range of tasks, including plain document OCR, scene text OCR, formatted document OCR, and even OCR for tables, charts, mathematical formulas, geometric shapes, molecular formu","status":"active","release_date":"2025-02-12","model_type":"other","page_url":"https://fal.run/fal-ai/got-ocr/v2","tagline":"GOT-OCR2 works on a wide range of tasks, including plain document OCR, scene text OCR, formatted document OCR, and even OCR for tables, charts, mathematical formulas, geometric shapes, molecular formu","capabilities":{"vision":true},"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/gpt-image-1/edit-image","name":"gpt-image-1","created_by":"fal","source":"official","family":"gpt-image-1","description":"OpenAI's latest image generation and editing model: gpt-1-image.","status":"active","release_date":"2025-04-23","model_type":"image","page_url":"https://fal.run/fal-ai/gpt-image-1/edit-image","tagline":"OpenAI's latest image generation and editing model: 
gpt-1-image.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/gpt-image-1-mini/edit","name":"GPT Image 1 Mini","created_by":"fal","source":"official","family":"gpt-image-1","description":"GPT Image 1 mini combines OpenAI's advanced language capabilities, powered by GPT-5, with GPT Image 1 Mini for efficient image generation.","status":"active","release_date":"2025-10-21","model_type":"image","page_url":"https://fal.run/fal-ai/gpt-image-1-mini/edit","tagline":"GPT Image 1 mini combines OpenAI's advanced language capabilities, powered by GPT-5, with GPT Image 1 Mini for efficient image generation.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/gpt-image-1-mini","name":"GPT Image 1 Mini","created_by":"fal","source":"official","family":"gpt-image-1","description":"GPT Image 1 mini combines OpenAI's advanced language capabilities, powered by GPT-5, with GPT Image 1 Mini for efficient image generation.","status":"active","release_date":"2025-10-21","model_type":"image","page_url":"https://fal.run/fal-ai/gpt-image-1-mini","tagline":"GPT Image 1 mini combines OpenAI's advanced language capabilities, powered by GPT-5, with GPT Image 1 Mini for efficient image generation.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/gpt-image-1/text-to-image","name":"gpt-image-1","created_by":"fal","source":"official","family":"gpt-image-1","description":"OpenAI's latest image generation and editing model: gpt-1-image.","status":"active","release_date":"2025-04-23","model_type":"image","page_url":"https://fal.run/fal-ai/gpt-image-1/text-to-image","tagline":"OpenAI's latest image generation and 
editing model: gpt-1-image.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/gpt-image-1.5/edit","name":"GPT-Image 1.5","created_by":"fal","source":"official","family":"gpt-image-1.5","description":"GPT Image 1.5 generates high-fidelity images with strong prompt adherence, preserving composition, lighting, and fine-grained detail.","status":"active","release_date":"2025-12-16","model_type":"image","page_url":"https://fal.run/fal-ai/gpt-image-1.5/edit","tagline":"GPT Image 1.5 generates high-fidelity images with strong prompt adherence, preserving composition, lighting, and fine-grained detail.","capabilities":{"streaming":true,"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/gpt-image-1.5","name":"GPT-Image 1.5","created_by":"fal","source":"official","family":"gpt-image-1.5","description":"GPT Image 1.5 generates high-fidelity images with strong prompt adherence, preserving composition, lighting, and fine-grained detail.","status":"active","release_date":"2025-12-16","model_type":"image","page_url":"https://fal.run/fal-ai/gpt-image-1.5","tagline":"GPT Image 1.5 generates high-fidelity images with strong prompt adherence, preserving composition, lighting, and fine-grained detail.","capabilities":{"streaming":true,"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/heygen/avatar3/digital-twin","name":"Heygen","created_by":"fal","source":"official","description":"Heygen Avatar V3 Model for Digital Twin","status":"active","release_date":"2026-02-23","model_type":"video","page_url":"https://fal.run/fal-ai/heygen/avatar3/digital-twin","tagline":"Heygen Avatar V3 Model for Digital 
Twin","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/heygen/avatar4/digital-twin","name":"Heygen","created_by":"fal","source":"official","description":"Heygen Avatar 4 Digital Twin Model","status":"active","release_date":"2026-02-23","model_type":"video","page_url":"https://fal.run/fal-ai/heygen/avatar4/digital-twin","tagline":"Heygen Avatar 4 Digital Twin Model","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/heygen/avatar4/image-to-video","name":"Heygen","created_by":"fal","source":"official","description":"Heygen Photo Avatar 4 Model","status":"active","release_date":"2026-02-23","model_type":"video","page_url":"https://fal.run/fal-ai/heygen/avatar4/image-to-video","tagline":"Heygen Photo Avatar 4 Model","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/heygen/avatar5/digital-twin","name":"Heygen v5 Digital Twin","created_by":"fal","source":"official","description":"Create natural HeyGen Avatar V digital twin videos from text or audio, with lip-sync, optional backgrounds, captions, and MP4/WebM output.","status":"active","release_date":"2026-05-17","model_type":"video","page_url":"https://fal.run/fal-ai/heygen/avatar5/digital-twin","tagline":"Create natural HeyGen Avatar V digital twin videos from text or audio, with lip-sync, optional backgrounds, captions, and MP4/WebM output.","modalities":{"input":["text","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-05-20","last_updated":"2026-06-03"},{"id":"fal-ai/heygen/v2/translate/precision","name":"Heygen","created_by":"fal","source":"official","description":"Heygen Translate Model with Extreme 
Precision","status":"active","release_date":"2026-02-23","model_type":"other","page_url":"https://fal.run/fal-ai/heygen/v2/translate/precision","tagline":"Heygen Translate Model with Extreme Precision","last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/heygen/v2/translate/speed","name":"Heygen","created_by":"fal","source":"official","description":"Heygen Translate Model with Extreme Speed","status":"active","release_date":"2026-02-23","model_type":"other","page_url":"https://fal.run/fal-ai/heygen/v2/translate/speed","tagline":"Heygen Translate Model with Extreme Speed","last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/heygen/v2/video-agent","name":"Heygen","created_by":"fal","source":"official","description":"Heygen Text to Video Generation Model","status":"active","release_date":"2026-02-15","model_type":"video","page_url":"https://fal.run/fal-ai/heygen/v2/video-agent","tagline":"Heygen Text to Video Generation Model","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/heygen/v3/lipsync/precision","name":"Heygen Lipsync - Precision","created_by":"fal","source":"official","description":"Replace or dub audio on an existing video with high-accuracy avatar-inference lip-sync.","status":"active","release_date":"2026-04-14","model_type":"other","page_url":"https://fal.run/fal-ai/heygen/v3/lipsync/precision","tagline":"Replace or dub audio on an existing video with high-accuracy avatar-inference lip-sync.","last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/heygen/v3/lipsync/speed","name":"Heygen Lipsync - Speed","created_by":"fal","source":"official","description":"Replace or dub audio on an existing video with fast audio-only lip-sync.","status":"active","release_date":"2026-04-14","model_type":"other","page_url":"https://fal.run/fal-ai/heygen/v3/lipsync/speed","tagline":"Replace or dub audio on an existing video with 
fast audio-only lip-sync.","last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/heygen/v3/video-agent","name":"Heygen Video Agent","created_by":"fal","source":"official","description":"Generate videos with a single prompt.","status":"active","release_date":"2026-04-16","model_type":"video","page_url":"https://fal.run/fal-ai/heygen/v3/video-agent","tagline":"Generate videos with a single prompt.","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/hidream-e1-1","name":"Hidream E1 1","created_by":"fal","source":"official","description":"Edit images with natural language","status":"active","release_date":"2025-07-23","model_type":"image","page_url":"https://fal.run/fal-ai/hidream-e1-1","tagline":"Edit images with natural language","capabilities":{"streaming":true,"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/hidream-i1-dev","name":"Hidream I1 Dev","created_by":"fal","source":"official","description":"HiDream-I1 dev is a new open-source image generative foundation model with 17B parameters that achieves state-of-the-art image generation quality within seconds.","status":"active","release_date":"2025-04-11","model_type":"image","page_url":"https://fal.run/fal-ai/hidream-i1-dev","tagline":"HiDream-I1 dev is a new open-source image generative foundation model with 17B parameters that achieves state-of-the-art image generation quality within seconds.","capabilities":{"streaming":true,"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/hidream-i1-fast","name":"Hidream I1 Fast","created_by":"fal","source":"official","description":"HiDream-I1 fast is a new open-source image generative foundation model with 17B parameters that achieves 
state-of-the-art image generation quality within 16 steps.","status":"active","release_date":"2025-04-11","model_type":"image","page_url":"https://fal.run/fal-ai/hidream-i1-fast","tagline":"HiDream-I1 fast is a new open-source image generative foundation model with 17B parameters that achieves state-of-the-art image generation quality within 16 steps.","capabilities":{"streaming":true,"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/hidream-i1-full/image-to-image","name":"Hidream I1 Full","created_by":"fal","source":"official","description":"HiDream-I1 full is a new open-source image generative foundation model with 17B parameters that achieves state-of-the-art image generation quality within seconds.","status":"active","release_date":"2025-05-05","model_type":"image","page_url":"https://fal.run/fal-ai/hidream-i1-full/image-to-image","tagline":"HiDream-I1 full is a new open-source image generative foundation model with 17B parameters that achieves state-of-the-art image generation quality within seconds.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/hidream-i1-full","name":"Hidream I1 Full","created_by":"fal","source":"official","description":"HiDream-I1 full is a new open-source image generative foundation model with 17B parameters that achieves state-of-the-art image generation quality within seconds.","status":"active","release_date":"2025-04-11","model_type":"image","page_url":"https://fal.run/fal-ai/hidream-i1-full","tagline":"HiDream-I1 full is a new open-source image generative foundation model with 17B parameters that achieves state-of-the-art image generation quality within 
seconds.","capabilities":{"streaming":true,"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/hidream-o1-image/dev/edit","name":"Hidream O1 Image","created_by":"fal","source":"official","description":"Unified image generation with HiDream-O1-Image.","status":"active","release_date":"2026-05-09","model_type":"image","page_url":"https://fal.run/fal-ai/hidream-o1-image/dev/edit","tagline":"Unified image generation with HiDream-O1-Image.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-05-10","last_updated":"2026-05-11"},{"id":"fal-ai/hidream-o1-image/dev","name":"Hidream O1 Image","created_by":"fal","source":"official","description":"Unified image generation with HiDream-O1-Image.","status":"active","release_date":"2026-05-09","model_type":"image","page_url":"https://fal.run/fal-ai/hidream-o1-image/dev","tagline":"Unified image generation with HiDream-O1-Image.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-05-10","last_updated":"2026-05-11"},{"id":"fal-ai/hidream-o1-image/edit","name":"Hidream O1 Image","created_by":"fal","source":"official","description":"Unified image generation with HiDream-O1-Image.","status":"active","release_date":"2026-05-09","model_type":"image","page_url":"https://fal.run/fal-ai/hidream-o1-image/edit","tagline":"Unified image generation with HiDream-O1-Image.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-05-10","last_updated":"2026-05-11"},{"id":"fal-ai/hidream-o1-image","name":"Hidream O1 Image","created_by":"fal","source":"official","description":"Unified image generation with 
HiDream-O1-Image.","status":"active","release_date":"2026-05-09","model_type":"image","page_url":"https://fal.run/fal-ai/hidream-o1-image","tagline":"Unified image generation with HiDream-O1-Image.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-05-10","last_updated":"2026-05-11"},{"id":"fal-ai/hunyuan-3d/v3.1/part","name":"Hunyuan 3D Part Splitter","created_by":"fal","source":"official","description":"Split 3D models into parts with Hunyuan 3D","status":"active","release_date":"2026-01-27","model_type":"other","page_url":"https://fal.run/fal-ai/hunyuan-3d/v3.1/part","tagline":"Split 3D models into parts with Hunyuan 3D","last_seen_at":"2026-04-28","last_updated":"2026-05-11"},{"id":"fal-ai/hunyuan-3d/v3.1/pro/image-to-3d","name":"Hunyuan 3D Pro Image to 3D","created_by":"fal","source":"official","description":"Generate 3D models from images with Hunyuan 3D Pro","status":"active","release_date":"2026-01-27","model_type":"other","page_url":"https://fal.run/fal-ai/hunyuan-3d/v3.1/pro/image-to-3d","tagline":"Generate 3D models from images with Hunyuan 3D Pro","capabilities":{"vision":true},"last_seen_at":"2026-04-28","last_updated":"2026-05-11"},{"id":"fal-ai/hunyuan-3d/v3.1/pro/text-to-3d","name":"Hunyuan 3D Pro Text to 3D","created_by":"fal","source":"official","description":"Generate 3D models from text prompts with Hunyuan 3D Pro","status":"active","release_date":"2026-01-27","model_type":"other","page_url":"https://fal.run/fal-ai/hunyuan-3d/v3.1/pro/text-to-3d","tagline":"Generate 3D models from text prompts with Hunyuan 3D Pro","last_seen_at":"2026-04-28","last_updated":"2026-05-11"},{"id":"fal-ai/hunyuan-3d/v3.1/rapid/image-to-3d","name":"Hunyuan 3D Rapid Image to 3D","created_by":"fal","source":"official","description":"Rapidly generate 3D models from images using Hunyuan 
3D.","status":"active","release_date":"2026-01-27","model_type":"other","page_url":"https://fal.run/fal-ai/hunyuan-3d/v3.1/rapid/image-to-3d","tagline":"Rapidly generate 3D models from images using Hunyuan 3D.","capabilities":{"vision":true},"last_seen_at":"2026-04-28","last_updated":"2026-05-11"},{"id":"fal-ai/hunyuan-3d/v3.1/rapid/text-to-3d","name":"Hunyuan 3d","created_by":"fal","source":"official","description":"Create detailed, fully-textured 3D models with text","status":"active","release_date":"2026-01-29","model_type":"other","page_url":"https://fal.run/fal-ai/hunyuan-3d/v3.1/rapid/text-to-3d","tagline":"Create detailed, fully-textured 3D models with text","last_seen_at":"2026-04-28","last_updated":"2026-05-11"},{"id":"fal-ai/hunyuan-3d/v3.1/smart-topology","name":"Hunyuan 3D Smart Topology","created_by":"fal","source":"official","description":"Optimize 3D mesh topology with Hunyuan 3D Smart Topology.","status":"active","release_date":"2026-01-27","model_type":"other","page_url":"https://fal.run/fal-ai/hunyuan-3d/v3.1/smart-topology","tagline":"Optimize 3D mesh topology with Hunyuan 3D Smart Topology.","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/hunyuan-avatar","name":"Hunyuan Avatar","created_by":"fal","source":"official","description":"HunyuanAvatar is a High-Fidelity Audio-Driven Human Animation model for Multiple Characters .","status":"active","release_date":"2025-05-29","model_type":"video","page_url":"https://fal.run/fal-ai/hunyuan-avatar","tagline":"HunyuanAvatar is a High-Fidelity Audio-Driven Human Animation model for Multiple Characters .","capabilities":{"vision":true},"modalities":{"input":["text","image","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/hunyuan-custom","name":"Hunyuan Custom","created_by":"fal","source":"official","description":"HunyuanCustom revolutionizes video generation with unmatched identity consistency across multiple 
input types.","status":"active","release_date":"2025-05-14","model_type":"video","page_url":"https://fal.run/fal-ai/hunyuan-custom","tagline":"HunyuanCustom revolutionizes video generation with unmatched identity consistency across multiple input types.","capabilities":{"vision":true},"modalities":{"input":["text","image","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/hunyuan-image/v2.1/text-to-image","name":"Hunyuan Image","created_by":"fal","source":"official","description":"Use the amazing capabilities of hunyuan image 2.1 to generate images that express the feelings of your text.","status":"active","release_date":"2025-09-09","model_type":"image","page_url":"https://fal.run/fal-ai/hunyuan-image/v2.1/text-to-image","tagline":"Use the amazing capabilities of hunyuan image 2.1 to generate images that express the feelings of your text.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/hunyuan-image/v3/instruct/edit","name":"Hunyuan Image","created_by":"fal","source":"official","description":"Image editing endpoint for Hunyuan Image 3.0 Instruct.","status":"active","release_date":"2026-01-28","model_type":"image","page_url":"https://fal.run/fal-ai/hunyuan-image/v3/instruct/edit","tagline":"Image editing endpoint for Hunyuan Image 3.0 Instruct.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-28","last_updated":"2026-05-11"},{"id":"fal-ai/hunyuan-image/v3/instruct/text-to-image","name":"Hunyuan Image 3.0 Instruct","created_by":"fal","source":"official","description":"Instruct version of Hunyuan-Image 3.0, with internal reasoning 
capabilities.","status":"active","release_date":"2026-01-28","model_type":"image","page_url":"https://fal.run/fal-ai/hunyuan-image/v3/instruct/text-to-image","tagline":"Instruct version of Hunyuan-Image 3.0, with internal reasoning capabilities.","capabilities":{"vision":true,"reasoning":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-05-14","last_updated":"2026-06-03"},{"id":"fal-ai/hunyuan-image/v3/text-to-image","name":"Hunyuan Image","created_by":"fal","source":"official","description":"Leverage the state-of-the-art capabilities of Hunyuan Image 3.0 to generate visual content that effectively conveys the messaging of your written material.","status":"active","release_date":"2025-09-28","model_type":"image","page_url":"https://fal.run/fal-ai/hunyuan-image/v3/text-to-image","tagline":"Leverage the state-of-the-art capabilities of Hunyuan Image 3.0 to generate visual content that effectively conveys the messaging of your written material.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/hunyuan-motion/fast","name":"Hunyuan Motion [0.46B]","created_by":"fal","source":"official","description":"Generate 3D human motions via text-to-generation interface of Hunyuan Motion!","status":"active","release_date":"2025-12-30","model_type":"other","page_url":"https://fal.run/fal-ai/hunyuan-motion/fast","tagline":"Generate 3D human motions via text-to-generation interface of Hunyuan Motion!","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/hunyuan-motion","name":"Hunyuan Motion [1B]","created_by":"fal","source":"official","description":"Generate 3D human motions via text-to-generation interface of Hunyuan Motion!","status":"active","release_date":"2025-12-30","model_type":"other","page_url":"https://fal.run/fal-ai/hunyuan-motion","tagline":"Generate 3D human motions via 
text-to-generation interface of Hunyuan Motion!","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/hunyuan-part","name":"Hunyuan Part","created_by":"fal","source":"official","description":"Use the capabilities of hunyuan part to generate point clouds from your 3D files.","status":"active","release_date":"2025-10-08","model_type":"other","page_url":"https://fal.run/fal-ai/hunyuan-part","tagline":"Use the capabilities of hunyuan part to generate point clouds from your 3D files.","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/hunyuan-portrait","name":"Hunyuan Portrait","created_by":"fal","source":"official","description":"HunyuanPortrait is a diffusion-based framework for generating lifelike, temporally consistent portrait animations.","status":"active","release_date":"2025-05-27","model_type":"video","page_url":"https://fal.run/fal-ai/hunyuan-portrait","tagline":"HunyuanPortrait is a diffusion-based framework for generating lifelike, temporally consistent portrait animations.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/hunyuan-video-foley","name":"Hunyuan Video Foley","created_by":"fal","source":"official","description":"Use the capabilities of the hunyuan foley model to bring life to your videos by adding sound effect to them.","status":"active","release_date":"2025-09-08","model_type":"other","page_url":"https://fal.run/fal-ai/hunyuan-video-foley","tagline":"Use the capabilities of the hunyuan foley model to bring life to your videos by adding sound effect to them.","last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/hunyuan-video-image-to-video","name":"Hunyuan Video Image-to-Video Inference","created_by":"fal","source":"official","description":"Image to Video for the high-quality Hunyuan Video I2V 
model.","status":"active","release_date":"2025-03-06","model_type":"video","page_url":"https://fal.run/fal-ai/hunyuan-video-image-to-video","tagline":"Image to Video for the high-quality Hunyuan Video I2V model.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/hunyuan-video-img2vid-lora","name":"Hunyuan Video Image-to-Video LoRA Inference","created_by":"fal","source":"official","description":"Image to Video for the Hunyuan Video model using a custom trained LoRA.","status":"active","release_date":"2025-02-03","model_type":"video","page_url":"https://fal.run/fal-ai/hunyuan-video-img2vid-lora","tagline":"Image to Video for the Hunyuan Video model using a custom trained LoRA.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/hunyuan-video-lora-training","name":"Train Hunyuan LoRA","created_by":"fal","source":"official","description":"Train Hunyuan Video lora on people, objects, characters and more!","status":"active","release_date":"2025-01-14","model_type":"other","page_url":"https://fal.run/fal-ai/hunyuan-video-lora-training","tagline":"Train Hunyuan Video lora on people, objects, characters and more!","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/hunyuan-video-lora/video-to-video","name":"Hunyuan Video LoRA Inference (Video-to-Video)","created_by":"fal","source":"official","description":"Hunyuan Video is an Open video generation model with high visual quality, motion diversity, text-video alignment, and generation stability.","status":"active","release_date":"2025-01-30","model_type":"other","page_url":"https://fal.run/fal-ai/hunyuan-video-lora/video-to-video","tagline":"Hunyuan Video is an Open video generation model with high visual quality, motion diversity, text-video 
alignment, and generation stability.","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/hunyuan-video-lora","name":"Hunyuan Video LoRA Inference","created_by":"fal","source":"official","description":"Hunyuan Video is an Open video generation model with high visual quality, motion diversity, text-video alignment, and generation stability","status":"active","release_date":"2025-01-16","model_type":"video","page_url":"https://fal.run/fal-ai/hunyuan-video-lora","tagline":"Hunyuan Video is an Open video generation model with high visual quality, motion diversity, text-video alignment, and generation stability","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/hunyuan-video-v1.5/image-to-video","name":"Hunyuan Video V1.5","created_by":"fal","source":"official","description":"Hunyuan Video 1.5 is Tencent's latest and best video model","status":"active","release_date":"2025-12-17","model_type":"video","page_url":"https://fal.run/fal-ai/hunyuan-video-v1.5/image-to-video","tagline":"Hunyuan Video 1.5 is Tencent's latest and best video model","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/hunyuan-video-v1.5/text-to-video","name":"Hunyuan Video V1.5","created_by":"fal","source":"official","description":"Hunyuan Video 1.5 is Tencent's latest and best video model","status":"active","release_date":"2025-11-21","model_type":"video","page_url":"https://fal.run/fal-ai/hunyuan-video-v1.5/text-to-video","tagline":"Hunyuan Video 1.5 is Tencent's latest and best video model","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/hunyuan-video/video-to-video","name":"Hunyuan Video 
(Video-to-Video)","created_by":"fal","source":"official","description":"Hunyuan Video is an Open video generation model with high visual quality, motion diversity, text-video alignment, and generation stability.","status":"active","release_date":"2025-01-30","model_type":"other","page_url":"https://fal.run/fal-ai/hunyuan-video/video-to-video","tagline":"Hunyuan Video is an Open video generation model with high visual quality, motion diversity, text-video alignment, and generation stability.","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/hunyuan-video","name":"Hunyuan Video","created_by":"fal","source":"official","description":"Hunyuan Video is an Open video generation model with high visual quality, motion diversity, text-video alignment, and generation stability.","status":"active","release_date":"2024-10-22","model_type":"video","page_url":"https://fal.run/fal-ai/hunyuan-video","tagline":"Hunyuan Video is an Open video generation model with high visual quality, motion diversity, text-video alignment, and generation stability.","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/hunyuan3d/v2/mini/turbo","name":"Hunyuan3D","created_by":"fal","source":"official","description":"Generate 3D models from your images using Hunyuan 3D.","status":"active","release_date":"2025-03-20","model_type":"other","page_url":"https://fal.run/fal-ai/hunyuan3d/v2/mini/turbo","tagline":"Generate 3D models from your images using Hunyuan 3D.","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/hunyuan3d/v2/mini","name":"Hunyuan3D","created_by":"fal","source":"official","description":"Generate 3D models from your images using Hunyuan 3D.","status":"active","release_date":"2025-03-20","model_type":"other","page_url":"https://fal.run/fal-ai/hunyuan3d/v2/mini","tagline":"Generate 3D models from your images using Hunyuan 
3D.","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/hunyuan3d/v2/multi-view/turbo","name":"Hunyuan3D","created_by":"fal","source":"official","description":"Generate 3D models from your images using Hunyuan 3D.","status":"active","release_date":"2025-03-20","model_type":"other","page_url":"https://fal.run/fal-ai/hunyuan3d/v2/multi-view/turbo","tagline":"Generate 3D models from your images using Hunyuan 3D.","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/hunyuan3d/v2/multi-view","name":"Hunyuan3D","created_by":"fal","source":"official","description":"Generate 3D models from your images using Hunyuan 3D.","status":"active","release_date":"2025-03-20","model_type":"other","page_url":"https://fal.run/fal-ai/hunyuan3d/v2/multi-view","tagline":"Generate 3D models from your images using Hunyuan 3D.","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/hunyuan3d/v2/turbo","name":"Hunyuan3D","created_by":"fal","source":"official","description":"Generate 3D models from your images using Hunyuan 3D.","status":"active","release_date":"2025-03-20","model_type":"other","page_url":"https://fal.run/fal-ai/hunyuan3d/v2/turbo","tagline":"Generate 3D models from your images using Hunyuan 3D.","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/hunyuan3d/v2","name":"Hunyuan3D","created_by":"fal","source":"official","description":"Generate 3D models from your images using Hunyuan 3D.","status":"active","release_date":"2025-03-20","model_type":"other","page_url":"https://fal.run/fal-ai/hunyuan3d/v2","tagline":"Generate 3D models from your images using Hunyuan 3D.","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/hunyuan3d-v3/image-to-3d","name":"Hunyuan3d V3","created_by":"fal","source":"official","description":"Transform your 
photos into ultra-high-resolution 3D models in seconds.","status":"active","release_date":"2025-12-16","model_type":"other","page_url":"https://fal.run/fal-ai/hunyuan3d-v3/image-to-3d","tagline":"Transform your photos into ultra-high-resolution 3D models in seconds.","capabilities":{"vision":true},"last_seen_at":"2026-06-02","last_updated":"2026-06-03"},{"id":"fal-ai/hunyuan3d-v3/sketch-to-3d","name":"Hunyuan3d V3","created_by":"fal","source":"official","description":"Create your imagined 3D models with just text.","status":"active","release_date":"2025-12-16","model_type":"other","page_url":"https://fal.run/fal-ai/hunyuan3d-v3/sketch-to-3d","tagline":"Create your imagined 3D models with just text.","capabilities":{"vision":true},"last_seen_at":"2026-06-02","last_updated":"2026-06-03"},{"id":"fal-ai/hunyuan3d-v3/text-to-3d","name":"Hunyuan3d V3","created_by":"fal","source":"official","description":"Turn simple sketches into detailed, fully-textured 3D models.","status":"active","release_date":"2025-12-16","model_type":"other","page_url":"https://fal.run/fal-ai/hunyuan3d-v3/text-to-3d","tagline":"Turn simple sketches into detailed, fully-textured 3D models.","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/hunyuan_world/image-to-world","name":"Hunyuan World","created_by":"fal","source":"official","description":"Hunyuan World 1.0 turns a single image into a panorama or a 3D world.","status":"active","release_date":"2025-07-28","model_type":"other","page_url":"https://fal.run/fal-ai/hunyuan_world/image-to-world","tagline":"Hunyuan World 1.0 turns a single image into a panorama or a 3D world.","capabilities":{"vision":true},"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/hunyuan_world","name":"Hunyuan World","created_by":"fal","source":"official","description":"Hunyuan World 1.0 turns a single image into a panorama or a 3D 
world.","status":"active","release_date":"2025-07-28","model_type":"image","page_url":"https://fal.run/fal-ai/hunyuan_world","tagline":"Hunyuan World 1.0 turns a single image into a panorama or a 3D world.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/hy-wu-edit","name":"Hy Wu Edit","created_by":"fal","source":"official","description":"Image editing with HY-WU.","status":"active","release_date":"2026-03-25","model_type":"image","page_url":"https://fal.run/fal-ai/hy-wu-edit","tagline":"Image editing with HY-WU.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-05-07","last_updated":"2026-05-11"},{"id":"fal-ai/hyper-sdxl/image-to-image","name":"Hyper SDXL","created_by":"fal","source":"official","description":"Hyper-charge SDXL's performance and creativity.","status":"active","release_date":"2024-04-25","model_type":"image","page_url":"https://fal.run/fal-ai/hyper-sdxl/image-to-image","tagline":"Hyper-charge SDXL's performance and creativity.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/hyper-sdxl/inpainting","name":"Hyper SDXL","created_by":"fal","source":"official","description":"Hyper-charge SDXL's performance and creativity.","status":"active","release_date":"2024-04-25","model_type":"image","page_url":"https://fal.run/fal-ai/hyper-sdxl/inpainting","tagline":"Hyper-charge SDXL's performance and creativity.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/hyper-sdxl","name":"Hyper SDXL","created_by":"fal","source":"official","description":"Hyper-charge SDXL's performance and 
creativity.","status":"active","release_date":"2024-02-21","model_type":"image","page_url":"https://fal.run/fal-ai/hyper-sdxl","tagline":"Hyper-charge SDXL's performance and creativity.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/hyper3d/rodin/v2.5/fast","name":"Hyper3D - Rodin V2.5 - Image to 3D - Fast","created_by":"fal","source":"official","description":"Rodin V2.5 by Hyper3D generates realistic and production ready 3D models from text or images.","status":"active","release_date":"2026-06-05","model_type":"other","page_url":"https://fal.run/fal-ai/hyper3d/rodin/v2.5/fast","tagline":"Rodin V2.5 by Hyper3D generates realistic and production ready 3D models from text or images.","capabilities":{"vision":true},"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/hyper3d/rodin/v2.5/text-to-3d/fast","name":"Hyper3D - Rodin V2.5 - Text to 3D - Fast","created_by":"fal","source":"official","description":"Rodin V2.5 by Hyper3D generates realistic and production ready 3D models from text or images.","status":"active","release_date":"2026-06-05","model_type":"other","page_url":"https://fal.run/fal-ai/hyper3d/rodin/v2.5/text-to-3d/fast","tagline":"Rodin V2.5 by Hyper3D generates realistic and production ready 3D models from text or images.","capabilities":{"vision":true},"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/hyper3d/rodin/v2.5/text-to-3d","name":"Hyper3D - Rodin V2.5 - Text to 3D","created_by":"fal","source":"official","description":"Rodin V2.5 by Hyper3D generates realistic and production ready 3D models from text or images.","status":"active","release_date":"2026-05-28","model_type":"other","page_url":"https://fal.run/fal-ai/hyper3d/rodin/v2.5/text-to-3d","tagline":"Rodin V2.5 by Hyper3D generates realistic and production ready 3D models from text or 
images.","capabilities":{"vision":true},"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/hyper3d/rodin/v2.5","name":"Hyper3D - Rodin V2.5 - Image to 3D","created_by":"fal","source":"official","description":"Rodin V2.5 by Hyper3D generates realistic and production ready 3D models from text or images.","status":"active","release_date":"2026-05-28","model_type":"other","page_url":"https://fal.run/fal-ai/hyper3d/rodin/v2.5","tagline":"Rodin V2.5 by Hyper3D generates realistic and production ready 3D models from text or images.","capabilities":{"vision":true},"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/hyper3d/rodin/v2","name":"Hyper3d","created_by":"fal","source":"official","description":"Rodin by Hyper3D generates realistic and production ready 3D models from text or images.","status":"active","release_date":"2025-09-26","model_type":"other","page_url":"https://fal.run/fal-ai/hyper3d/rodin/v2","tagline":"Rodin by Hyper3D generates realistic and production ready 3D models from text or images.","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/hyper3d/rodin","name":"Hyper3D Rodin","created_by":"fal","source":"official","description":"Rodin by Hyper3D generates realistic and production ready 3D models from text or images.","status":"active","release_date":"2024-12-16","model_type":"other","page_url":"https://fal.run/fal-ai/hyper3d/rodin","tagline":"Rodin by Hyper3D generates realistic and production ready 3D models from text or images.","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/iclight-v2","name":"IC-Light-v2 for Image Relighting","created_by":"fal","source":"official","description":"An endpoint for re-lighting photos and changing their backgrounds per a given description","status":"active","release_date":"2024-11-14","model_type":"image","page_url":"https://fal.run/fal-ai/iclight-v2","tagline":"An endpoint for 
re-lighting photos and changing their backgrounds per a given description","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/ideogram/character/edit","name":"Ideogram V3 Character Edit","created_by":"fal","source":"official","description":"Modify consistent characters while preserving their core identity.","status":"active","release_date":"2025-08-07","model_type":"image","page_url":"https://fal.run/fal-ai/ideogram/character/edit","tagline":"Modify consistent characters while preserving their core identity.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/ideogram/character/remix","name":"Ideogram V3 Character Remix","created_by":"fal","source":"official","description":"Transform your consistent character into different art styles, settings, or scenarios while maintaining their distinctive appearance and identity","status":"active","release_date":"2025-08-07","model_type":"image","page_url":"https://fal.run/fal-ai/ideogram/character/remix","tagline":"Transform your consistent character into different art styles, settings, or scenarios while maintaining their distinctive appearance and identity","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/ideogram/character","name":"Ideogram V3 Character","created_by":"fal","source":"official","description":"Generate consistent character appearances across multiple images.","status":"active","release_date":"2025-08-07","model_type":"image","page_url":"https://fal.run/fal-ai/ideogram/character","tagline":"Generate consistent character appearances across multiple 
images.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/ideogram/custom-models/generate","name":"Ideogram","created_by":"fal","source":"official","description":"Train Ideogram on your photos, your style, your subject, your look, from a small set of reference images to images that feel consistently yours ","status":"active","release_date":"2026-04-22","model_type":"image","page_url":"https://fal.run/fal-ai/ideogram/custom-models/generate","tagline":"Train Ideogram on your photos, your style, your subject, your look, from a small set of reference images to images that feel consistently yours ","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/ideogram/custom-models","name":"Ideogram","created_by":"fal","source":"official","description":"Train Ideogram on your photos, your style, your subject, your look, from a small set of reference images to images that feel consistently yours ","status":"active","release_date":"2026-04-22","model_type":"other","page_url":"https://fal.run/fal-ai/ideogram/custom-models","tagline":"Train Ideogram on your photos, your style, your subject, your look, from a small set of reference images to images that feel consistently yours ","capabilities":{"vision":true},"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/ideogram/remove-background","name":"Ideogram Remove Background","created_by":"fal","source":"official","description":"Remove backgrounds from existing images with Ideogram's remove background feature.","status":"active","release_date":"2026-05-07","model_type":"image","page_url":"https://fal.run/fal-ai/ideogram/remove-background","tagline":"Remove backgrounds from existing images with Ideogram's remove background 
feature.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-05-13","last_updated":"2026-06-03"},{"id":"fal-ai/ideogram/upscale","name":"Ideogram Upscale","created_by":"fal","source":"official","description":"Ideogram Upscale enhances the resolution of the reference image by up to 2X and might enhance the reference image too.","status":"active","release_date":"2025-02-10","model_type":"image","page_url":"https://fal.run/fal-ai/ideogram/upscale","tagline":"Ideogram Upscale enhances the resolution of the reference image by up to 2X and might enhance the reference image too.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/ideogram/v2/edit","name":"Ideogram V2 Edit","created_by":"fal","source":"official","description":"Transform existing images with Ideogram V2's editing capabilities.","status":"active","release_date":"2024-12-14","model_type":"image","page_url":"https://fal.run/fal-ai/ideogram/v2/edit","tagline":"Transform existing images with Ideogram V2's editing capabilities.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/ideogram/v2/remix","name":"Ideogram V2 Remix","created_by":"fal","source":"official","description":"Reimagine existing images with Ideogram V2's remix feature.","status":"active","release_date":"2024-12-04","model_type":"image","page_url":"https://fal.run/fal-ai/ideogram/v2/remix","tagline":"Reimagine existing images with Ideogram V2's remix feature.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/ideogram/v2/turbo/edit","name":"Ideogram V2 Turbo 
Edit","created_by":"fal","source":"official","description":"Edit images faster with Ideogram V2 Turbo.","status":"active","release_date":"2024-12-04","model_type":"image","page_url":"https://fal.run/fal-ai/ideogram/v2/turbo/edit","tagline":"Edit images faster with Ideogram V2 Turbo.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/ideogram/v2/turbo/remix","name":"Ideogram V2 Turbo Remix","created_by":"fal","source":"official","description":"Rapidly create image variations with Ideogram V2 Turbo Remix.","status":"active","release_date":"2024-12-04","model_type":"image","page_url":"https://fal.run/fal-ai/ideogram/v2/turbo/remix","tagline":"Rapidly create image variations with Ideogram V2 Turbo Remix.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/ideogram/v2/turbo","name":"Ideogram V2 Turbo","created_by":"fal","source":"official","description":"Accelerated image generation with Ideogram V2 Turbo.","status":"active","release_date":"2024-12-04","model_type":"image","page_url":"https://fal.run/fal-ai/ideogram/v2/turbo","tagline":"Accelerated image generation with Ideogram V2 Turbo.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/ideogram/v2","name":"Ideogram V2","created_by":"fal","source":"official","description":"Generate high-quality images, posters, and logos with Ideogram V2.","status":"active","release_date":"2024-12-04","model_type":"image","page_url":"https://fal.run/fal-ai/ideogram/v2","tagline":"Generate high-quality images, posters, and logos with Ideogram 
V2.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/ideogram/v2a/remix","name":"Ideogram V2A Remix","created_by":"fal","source":"official","description":"Create variations of existing images with Ideogram V2A Remix while maintaining creative control through prompt guidance.","status":"active","release_date":"2025-02-27","model_type":"image","page_url":"https://fal.run/fal-ai/ideogram/v2a/remix","tagline":"Create variations of existing images with Ideogram V2A Remix while maintaining creative control through prompt guidance.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/ideogram/v2a/turbo/remix","name":"Ideogram V2A Turbo Remix","created_by":"fal","source":"official","description":"Rapidly create image variations with Ideogram V2A Turbo Remix.","status":"active","release_date":"2025-02-27","model_type":"image","page_url":"https://fal.run/fal-ai/ideogram/v2a/turbo/remix","tagline":"Rapidly create image variations with Ideogram V2A Turbo Remix.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/ideogram/v2a/turbo","name":"Ideogram V2A Turbo","created_by":"fal","source":"official","description":"Accelerated image generation with Ideogram V2A Turbo.","status":"active","release_date":"2025-02-27","model_type":"image","page_url":"https://fal.run/fal-ai/ideogram/v2a/turbo","tagline":"Accelerated image generation with Ideogram V2A Turbo.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/ideogram/v2a","name":"Ideogram 
V2A","created_by":"fal","source":"official","description":"Generate high-quality images, posters, and logos with Ideogram V2A.","status":"active","release_date":"2025-02-27","model_type":"image","page_url":"https://fal.run/fal-ai/ideogram/v2a","tagline":"Generate high-quality images, posters, and logos with Ideogram V2A.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/ideogram/v3/edit","name":"Ideogram V3 Edit","created_by":"fal","source":"official","description":"Transform existing images with Ideogram V3's editing capabilities.","status":"active","release_date":"2025-05-01","model_type":"image","page_url":"https://fal.run/fal-ai/ideogram/v3/edit","tagline":"Transform existing images with Ideogram V3's editing capabilities.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/ideogram/v3/generate-transparent","name":"Ideogram Transparent","created_by":"fal","source":"official","description":"Generate images with transparent backgrounds using Ideogram Transparent model","status":"active","release_date":"2026-04-07","model_type":"image","page_url":"https://fal.run/fal-ai/ideogram/v3/generate-transparent","tagline":"Generate images with transparent backgrounds using Ideogram Transparent model","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/ideogram/v3/layerize-text","name":"Ideogram","created_by":"fal","source":"official","description":"Ideogram Layerize takes an existing flat graphic, removes text, and returns structured text containers you can edit/recompose in html or json 
format.","status":"active","release_date":"2026-04-07","model_type":"image","page_url":"https://fal.run/fal-ai/ideogram/v3/layerize-text","tagline":"Ideogram Layerize takes an existing flat graphic, removes text, and returns structured text containers you can edit/recompose in html or json format.","capabilities":{"vision":true,"structured_output":true,"json_mode":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/ideogram/v3/reframe","name":"Ideogram","created_by":"fal","source":"official","description":"Extend existing images with Ideogram V3's reframe feature.","status":"active","release_date":"2025-05-01","model_type":"image","page_url":"https://fal.run/fal-ai/ideogram/v3/reframe","tagline":"Extend existing images with Ideogram V3's reframe feature.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/ideogram/v3/remix","name":"Ideogram","created_by":"fal","source":"official","description":"Reimagine existing images with Ideogram V3's remix feature.","status":"active","release_date":"2025-05-01","model_type":"image","page_url":"https://fal.run/fal-ai/ideogram/v3/remix","tagline":"Reimagine existing images with Ideogram V3's remix feature.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/ideogram/v3/replace-background","name":"Ideogram Replace Background","created_by":"fal","source":"official","description":"Replace backgrounds existing images with Ideogram V3's replace background feature.","status":"active","release_date":"2025-05-01","model_type":"image","page_url":"https://fal.run/fal-ai/ideogram/v3/replace-background","tagline":"Replace backgrounds existing images with Ideogram V3's 
replace background feature.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/ideogram/v3","name":"Ideogram Text to Image","created_by":"fal","source":"official","description":"Generate high-quality images, posters, and logos with Ideogram V3.","status":"active","release_date":"2025-05-01","model_type":"image","page_url":"https://fal.run/fal-ai/ideogram/v3","tagline":"Generate high-quality images, posters, and logos with Ideogram V3.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/illusion-diffusion","name":"Illusion Diffusion","created_by":"fal","source":"official","description":"Create illusions conditioned on image.","status":"active","release_date":"2024-02-13","model_type":"image","page_url":"https://fal.run/fal-ai/illusion-diffusion","tagline":"Create illusions conditioned on image.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/image-apps-v2/age-modify","name":"Age Modify","created_by":"fal","source":"official","description":"Modify a face to look younger or older while keeping identity realistic.","status":"active","release_date":"2025-09-18","model_type":"image","page_url":"https://fal.run/fal-ai/image-apps-v2/age-modify","tagline":"Modify a face to look younger or older while keeping identity realistic.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/image-apps-v2/city-teleport","name":"City Teleport","created_by":"fal","source":"official","description":"Place a person’s photo into iconic cities 
worldwide.","status":"active","release_date":"2025-09-18","model_type":"image","page_url":"https://fal.run/fal-ai/image-apps-v2/city-teleport","tagline":"Place a person’s photo into iconic cities worldwide.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/image-apps-v2/expression-change","name":"Expression Change","created_by":"fal","source":"official","description":"Change facial expressions in photos with realistic results.","status":"active","release_date":"2025-09-18","model_type":"image","page_url":"https://fal.run/fal-ai/image-apps-v2/expression-change","tagline":"Change facial expressions in photos with realistic results.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/image-apps-v2/hair-change","name":"Hair Change","created_by":"fal","source":"official","description":"Change hairstyles and hair colors in photos realistically.","status":"active","release_date":"2025-09-18","model_type":"image","page_url":"https://fal.run/fal-ai/image-apps-v2/hair-change","tagline":"Change hairstyles and hair colors in photos realistically.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/image-apps-v2/headshot-photo","name":"Headshot Generator","created_by":"fal","source":"official","description":"Generate professional headshot photos with customizable backgrounds.","status":"active","release_date":"2025-09-18","model_type":"image","page_url":"https://fal.run/fal-ai/image-apps-v2/headshot-photo","tagline":"Generate professional headshot photos with customizable 
backgrounds.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/image-apps-v2/makeup-application","name":"Makeup Changer","created_by":"fal","source":"official","description":"Apply realistic makeup styles with adjustable intensity.","status":"active","release_date":"2025-09-18","model_type":"image","page_url":"https://fal.run/fal-ai/image-apps-v2/makeup-application","tagline":"Apply realistic makeup styles with adjustable intensity.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/image-apps-v2/object-removal","name":"Object Removal","created_by":"fal","source":"official","description":"Remove unwanted objects seamlessly from any image.","status":"active","release_date":"2025-09-18","model_type":"image","page_url":"https://fal.run/fal-ai/image-apps-v2/object-removal","tagline":"Remove unwanted objects seamlessly from any image.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/image-apps-v2/outpaint","name":"Image Outpaint","created_by":"fal","source":"official","description":"Directional outpainting.","status":"active","release_date":"2025-11-03","model_type":"image","page_url":"https://fal.run/fal-ai/image-apps-v2/outpaint","tagline":"Directional outpainting.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/image-apps-v2/perspective","name":"Perspective Change","created_by":"fal","source":"official","description":"Easily adjust the perspective of any image to different 
angles.","status":"active","release_date":"2025-09-18","model_type":"image","page_url":"https://fal.run/fal-ai/image-apps-v2/perspective","tagline":"Easily adjust the perspective of any image to different angles.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/image-apps-v2/photo-restoration","name":"Photo Restoration","created_by":"fal","source":"official","description":"Restore old or damaged photos by fixing colors, scratches, and resolution.","status":"active","release_date":"2025-09-18","model_type":"image","page_url":"https://fal.run/fal-ai/image-apps-v2/photo-restoration","tagline":"Restore old or damaged photos by fixing colors, scratches, and resolution.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/image-apps-v2/photography-effects","name":"Photography Effects","created_by":"fal","source":"official","description":"Apply diverse photography styles and effects to transform your images.","status":"active","release_date":"2025-09-18","model_type":"image","page_url":"https://fal.run/fal-ai/image-apps-v2/photography-effects","tagline":"Apply diverse photography styles and effects to transform your images.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/image-apps-v2/portrait-enhance","name":"Portrait Enhance","created_by":"fal","source":"official","description":"Enhance and refine portrait photos with improved clarity and detail.","status":"active","release_date":"2025-09-18","model_type":"image","page_url":"https://fal.run/fal-ai/image-apps-v2/portrait-enhance","tagline":"Enhance and refine portrait photos with improved clarity and 
detail.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/image-apps-v2/product-holding","name":"Product Holding","created_by":"fal","source":"official","description":"Place products naturally in a person’s hands for realistic marketing visuals.","status":"active","release_date":"2025-09-19","model_type":"image","page_url":"https://fal.run/fal-ai/image-apps-v2/product-holding","tagline":"Place products naturally in a person’s hands for realistic marketing visuals.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/image-apps-v2/product-photography","name":"Product Photography","created_by":"fal","source":"official","description":"Generate professional product photography with realistic lighting and backgrounds.","status":"active","release_date":"2025-09-19","model_type":"image","page_url":"https://fal.run/fal-ai/image-apps-v2/product-photography","tagline":"Generate professional product photography with realistic lighting and backgrounds.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/image-apps-v2/relighting","name":"Relighting","created_by":"fal","source":"official","description":"Adjust and enhance images with different lighting styles.","status":"active","release_date":"2025-09-18","model_type":"image","page_url":"https://fal.run/fal-ai/image-apps-v2/relighting","tagline":"Adjust and enhance images with different lighting styles.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/image-apps-v2/style-transfer","name":"Style 
Transfer","created_by":"fal","source":"official","description":"Apply artistic styles like impressionism, cubism, or surrealism to your images.","status":"active","release_date":"2025-09-18","model_type":"image","page_url":"https://fal.run/fal-ai/image-apps-v2/style-transfer","tagline":"Apply artistic styles like impressionism, cubism, or surrealism to your images.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/image-apps-v2/texture-transform","name":"Texture Transform","created_by":"fal","source":"official","description":"Transform objects with different surface textures like marble, wood, or fabric.","status":"active","release_date":"2025-09-18","model_type":"image","page_url":"https://fal.run/fal-ai/image-apps-v2/texture-transform","tagline":"Transform objects with different surface textures like marble, wood, or fabric.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/image-apps-v2/virtual-try-on","name":"Virtual Try-on","created_by":"fal","source":"official","description":"Try on clothes virtually by combining person and clothing images.","status":"active","release_date":"2025-09-18","model_type":"image","page_url":"https://fal.run/fal-ai/image-apps-v2/virtual-try-on","tagline":"Try on clothes virtually by combining person and clothing images.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/image-editing/age-progression","name":"Image Editing Age Progression","created_by":"fal","source":"official","description":"See how you or others might look at different ages, from younger to older, while preserving core facial 
features.","status":"active","release_date":"2025-05-29","model_type":"image","page_url":"https://fal.run/fal-ai/image-editing/age-progression","tagline":"See how you or others might look at different ages, from younger to older, while preserving core facial features.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/image-editing/baby-version","name":"Image Editing","created_by":"fal","source":"official","description":"Transform any person into their baby version, while preserving the original pose and expression with childlike features.","status":"active","release_date":"2025-06-03","model_type":"image","page_url":"https://fal.run/fal-ai/image-editing/baby-version","tagline":"Transform any person into their baby version, while preserving the original pose and expression with childlike features.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/image-editing/background-change","name":"Image Editing Background Change","created_by":"fal","source":"official","description":"Replace your photo's background with any scene you desire, from beach sunsets to urban landscapes, with perfect lighting and shadows","status":"active","release_date":"2025-05-29","model_type":"image","page_url":"https://fal.run/fal-ai/image-editing/background-change","tagline":"Replace your photo's background with any scene you desire, from beach sunsets to urban landscapes, with perfect lighting and shadows","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/image-editing/broccoli-haircut","name":"Image Editing Broccoli Haircut","created_by":"fal","source":"official","description":"Transform your 
character's hair into broccoli style while keeping the original characters likeness","status":"active","release_date":"2025-06-26","model_type":"image","page_url":"https://fal.run/fal-ai/image-editing/broccoli-haircut","tagline":"Transform your character's hair into broccoli style while keeping the original characters likeness","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/image-editing/cartoonify","name":"Image Editing Cartoonify","created_by":"fal","source":"official","description":"Transform your photos into vibrant cool cartoons with bold outlines and rich colors.","status":"active","release_date":"2025-05-29","model_type":"image","page_url":"https://fal.run/fal-ai/image-editing/cartoonify","tagline":"Transform your photos into vibrant cool cartoons with bold outlines and rich colors.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/image-editing/color-correction","name":"Image Editing Color Correction","created_by":"fal","source":"official","description":"Perfect your photos with professional color grading, balanced tones, and vibrant yet natural colors","status":"active","release_date":"2025-05-29","model_type":"image","page_url":"https://fal.run/fal-ai/image-editing/color-correction","tagline":"Perfect your photos with professional color grading, balanced tones, and vibrant yet natural colors","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/image-editing/expression-change","name":"Image Editing Expression Change","created_by":"fal","source":"official","description":"Change facial expressions in photos to any emotion you desire, from smiles to serious 
looks.","status":"active","release_date":"2025-05-29","model_type":"image","page_url":"https://fal.run/fal-ai/image-editing/expression-change","tagline":"Change facial expressions in photos to any emotion you desire, from smiles to serious looks.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/image-editing/face-enhancement","name":"Image Editing Face Enhancement","created_by":"fal","source":"official","description":"Enhance facial features with professional retouching while maintaining a natural, realistic look","status":"active","release_date":"2025-05-29","model_type":"image","page_url":"https://fal.run/fal-ai/image-editing/face-enhancement","tagline":"Enhance facial features with professional retouching while maintaining a natural, realistic look","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/image-editing/hair-change","name":"Image Editing Hair Change","created_by":"fal","source":"official","description":"Experiment with different hairstyles, from bald to any style you can imagine, while maintaining natural lighting and realistic results.","status":"active","release_date":"2025-05-29","model_type":"image","page_url":"https://fal.run/fal-ai/image-editing/hair-change","tagline":"Experiment with different hairstyles, from bald to any style you can imagine, while maintaining natural lighting and realistic results.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/image-editing/object-removal","name":"Image Editing Object Removal","created_by":"fal","source":"official","description":"Remove unwanted objects or people from your photos while seamlessly blending the 
background.","status":"active","release_date":"2025-05-29","model_type":"image","page_url":"https://fal.run/fal-ai/image-editing/object-removal","tagline":"Remove unwanted objects or people from your photos while seamlessly blending the background.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-01","last_updated":"2026-06-03"},{"id":"fal-ai/image-editing/photo-restoration","name":"Image Editing Photo Restoration","created_by":"fal","source":"official","description":"Restore and enhance old or damaged photos by removing imperfections, adding color while preserving the original character and details of the image.","status":"active","release_date":"2025-06-02","model_type":"image","page_url":"https://fal.run/fal-ai/image-editing/photo-restoration","tagline":"Restore and enhance old or damaged photos by removing imperfections, adding color while preserving the original character and details of the image.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/image-editing/plushie-style","name":"Image Editing Plushie Style","created_by":"fal","source":"official","description":"Transform your photos into cool plushies while keeping the original characters likeness","status":"active","release_date":"2025-06-26","model_type":"image","page_url":"https://fal.run/fal-ai/image-editing/plushie-style","tagline":"Transform your photos into cool plushies while keeping the original characters likeness","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/image-editing/professional-photo","name":"Image Editing Professional Photo","created_by":"fal","source":"official","description":"Turn your casual photos into stunning professional 
studio portraits with perfect lighting and high-end photography style.","status":"active","release_date":"2025-05-29","model_type":"image","page_url":"https://fal.run/fal-ai/image-editing/professional-photo","tagline":"Turn your casual photos into stunning professional studio portraits with perfect lighting and high-end photography style.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/image-editing/realism","name":"Image Editing Realism","created_by":"fal","source":"official","description":"Add details to faces, enhance face features, remove blur.","status":"active","release_date":"2025-07-07","model_type":"image","page_url":"https://fal.run/fal-ai/image-editing/realism","tagline":"Add details to faces, enhance face features, remove blur.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/image-editing/reframe","name":"Image Editing Reframe","created_by":"fal","source":"official","description":"The reframe endpoint intelligently adjusts an image's aspect ratio while preserving the main subject's position, composition, pose, and perspective","status":"active","release_date":"2025-06-05","model_type":"image","page_url":"https://fal.run/fal-ai/image-editing/reframe","tagline":"The reframe endpoint intelligently adjusts an image's aspect ratio while preserving the main subject's position, composition, pose, and perspective","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/image-editing/retouch","name":"Image Editing Retouch","created_by":"fal","source":"official","description":"Retouch photos of 
faces.","status":"active","release_date":"2025-07-24","model_type":"image","page_url":"https://fal.run/fal-ai/image-editing/retouch","tagline":"Retouch photos of faces.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/image-editing/scene-composition","name":"Image Editing Scene Composition","created_by":"fal","source":"official","description":"Place your subject in any scene you imagine, from enchanted forests to urban settings, with professional composition and lighting","status":"active","release_date":"2025-05-29","model_type":"image","page_url":"https://fal.run/fal-ai/image-editing/scene-composition","tagline":"Place your subject in any scene you imagine, from enchanted forests to urban settings, with professional composition and lighting","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/image-editing/style-transfer","name":"Image Editing Style Transfer","created_by":"fal","source":"official","description":"Transform your photos into artistic masterpieces inspired by famous styles like Van Gogh's Starry Night or any artistic style you choose.","status":"active","release_date":"2025-05-29","model_type":"image","page_url":"https://fal.run/fal-ai/image-editing/style-transfer","tagline":"Transform your photos into artistic masterpieces inspired by famous styles like Van Gogh's Starry Night or any artistic style you choose.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/image-editing/text-removal","name":"Image Editing Text Removal","created_by":"fal","source":"official","description":"Remove all text and writing from images while preserving the background and 
natural appearance.","status":"active","release_date":"2025-06-02","model_type":"image","page_url":"https://fal.run/fal-ai/image-editing/text-removal","tagline":"Remove all text and writing from images while preserving the background and natural appearance.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/image-editing/time-of-day","name":"Image Editing Time Of Day","created_by":"fal","source":"official","description":"Transform your photos to any time of day, from golden hour to midnight, with appropriate lighting and atmosphere.","status":"active","release_date":"2025-05-29","model_type":"image","page_url":"https://fal.run/fal-ai/image-editing/time-of-day","tagline":"Transform your photos to any time of day, from golden hour to midnight, with appropriate lighting and atmosphere.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/image-editing/weather-effect","name":"Image Editing Weather Effect","created_by":"fal","source":"official","description":"Add realistic weather effects like snowfall, rain, or fog to your photos while maintaining the scene's mood.","status":"active","release_date":"2025-05-29","model_type":"image","page_url":"https://fal.run/fal-ai/image-editing/weather-effect","tagline":"Add realistic weather effects like snowfall, rain, or fog to your photos while maintaining the scene's mood.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/image-editing/wojak-style","name":"Image Editing Wojak Style","created_by":"fal","source":"official","description":"Transform your photos into wojak style while keeping the original characters 
likeness","status":"active","release_date":"2025-06-26","model_type":"image","page_url":"https://fal.run/fal-ai/image-editing/wojak-style","tagline":"Transform your photos into wojak style while keeping the original characters likeness","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/image-editing/youtube-thumbnails","name":"Image Editing Youtube Thumbnails","created_by":"fal","source":"official","description":"Generate YouTube thumbnails with custom text","status":"active","release_date":"2025-06-30","model_type":"image","page_url":"https://fal.run/fal-ai/image-editing/youtube-thumbnails","tagline":"Generate YouTube thumbnails with custom text","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/image-preprocessors/depth-anything/v2","name":"Image Preprocessors","created_by":"fal","source":"official","description":"Depth Anything v2 preprocessor.","status":"active","release_date":"2024-09-16","model_type":"image","page_url":"https://fal.run/fal-ai/image-preprocessors/depth-anything/v2","tagline":"Depth Anything v2 preprocessor.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/image-preprocessors/hed","name":"Image Preprocessors","created_by":"fal","source":"official","description":"Holistically-Nested Edge Detection (HED) preprocessor.","status":"active","release_date":"2024-09-16","model_type":"image","page_url":"https://fal.run/fal-ai/image-preprocessors/hed","tagline":"Holistically-Nested Edge Detection (HED) 
preprocessor.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/image-preprocessors/lineart","name":"Image Preprocessors","created_by":"fal","source":"official","description":"Line art preprocessor.","status":"active","release_date":"2024-09-16","model_type":"image","page_url":"https://fal.run/fal-ai/image-preprocessors/lineart","tagline":"Line art preprocessor.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/image-preprocessors/midas","name":"Image Preprocessors","created_by":"fal","source":"official","description":"MiDaS depth estimation preprocessor.","status":"active","release_date":"2024-09-16","model_type":"image","page_url":"https://fal.run/fal-ai/image-preprocessors/midas","tagline":"MiDaS depth estimation preprocessor.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/image-preprocessors/mlsd","name":"Image Preprocessors","created_by":"fal","source":"official","description":"M-LSD line segment detection preprocessor.","status":"active","release_date":"2024-09-16","model_type":"image","page_url":"https://fal.run/fal-ai/image-preprocessors/mlsd","tagline":"M-LSD line segment detection preprocessor.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/image-preprocessors/pidi","name":"Image Preprocessors","created_by":"fal","source":"official","description":"PIDI (Pidinet) preprocessor.","status":"active","release_date":"2024-09-16","model_type":"image","page_url":"https://fal.run/fal-ai/image-preprocessors/pidi","tagline":"PIDI 
(Pidinet) preprocessor.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/image-preprocessors/sam","name":"Image Preprocessors","created_by":"fal","source":"official","description":"Segment Anything Model (SAM) preprocessor.","status":"active","release_date":"2024-09-16","model_type":"image","page_url":"https://fal.run/fal-ai/image-preprocessors/sam","tagline":"Segment Anything Model (SAM) preprocessor.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/image-preprocessors/scribble","name":"Image Preprocessors","created_by":"fal","source":"official","description":"Scribble preprocessor.","status":"active","release_date":"2024-09-16","model_type":"image","page_url":"https://fal.run/fal-ai/image-preprocessors/scribble","tagline":"Scribble preprocessor.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/image-preprocessors/teed","name":"Image Preprocessors","created_by":"fal","source":"official","description":"TEED (Temporal Edge Enhancement Detection) preprocessor.","status":"active","release_date":"2024-09-16","model_type":"image","page_url":"https://fal.run/fal-ai/image-preprocessors/teed","tagline":"TEED (Temporal Edge Enhancement Detection) preprocessor.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/image-preprocessors/zoe","name":"Image Preprocessors","created_by":"fal","source":"official","description":"ZoeDepth 
preprocessor.","status":"active","release_date":"2024-09-16","model_type":"image","page_url":"https://fal.run/fal-ai/image-preprocessors/zoe","tagline":"ZoeDepth preprocessor.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/image2pixel","name":"Image2Pixel","created_by":"fal","source":"official","description":"Turn images into pixel-perfect retro art","status":"active","release_date":"2025-10-14","model_type":"image","page_url":"https://fal.run/fal-ai/image2pixel","tagline":"Turn images into pixel-perfect retro art","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/image2svg","name":"Image2svg","created_by":"fal","source":"official","description":"Image2SVG transforms raster images into clean vector graphics, preserving visual quality while enabling scalable, customizable SVG outputs with precise control over detail levels.","status":"active","release_date":"2025-04-25","model_type":"image","page_url":"https://fal.run/fal-ai/image2svg","tagline":"Image2SVG transforms raster images into clean vector graphics, preserving visual quality while enabling scalable, customizable SVG outputs with precise control over detail levels.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/imagen3/fast","name":"Imagen3 Fast","created_by":"fal","source":"official","family":"imagen","description":"Imagen3 Fast is a high-quality text-to-image model that generates realistic images from text prompts.","status":"active","release_date":"2025-02-10","model_type":"image","page_url":"https://fal.run/fal-ai/imagen3/fast","tagline":"Imagen3 Fast is a high-quality text-to-image model that 
generates realistic images from text prompts.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-28","last_updated":"2026-05-11"},{"id":"fal-ai/imagen3","name":"Imagen3","created_by":"fal","source":"official","family":"imagen","description":"Imagen3 is a high-quality text-to-image model that generates realistic images from text prompts.","status":"active","release_date":"2025-02-10","model_type":"image","page_url":"https://fal.run/fal-ai/imagen3","tagline":"Imagen3 is a high-quality text-to-image model that generates realistic images from text prompts.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-28","last_updated":"2026-05-11"},{"id":"fal-ai/imagen4/preview/fast","name":"Imagen 4","created_by":"fal","source":"official","family":"imagen","description":"Google’s highest quality image generation model","status":"active","release_date":"2025-06-12","model_type":"image","page_url":"https://fal.run/fal-ai/imagen4/preview/fast","tagline":"Google’s highest quality image generation model","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-28","last_updated":"2026-05-11"},{"id":"fal-ai/imagen4/preview/ultra","name":"Imagen 4 Ultra","created_by":"fal","source":"official","family":"imagen","description":"Google’s highest quality image generation model","status":"active","release_date":"2025-05-20","model_type":"image","page_url":"https://fal.run/fal-ai/imagen4/preview/ultra","tagline":"Google’s highest quality image generation model","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-28","last_updated":"2026-05-11"},{"id":"fal-ai/imagen4/preview","name":"Imagen 4","created_by":"fal","source":"official","family":"imagen","description":"Google’s highest quality 
image generation model","status":"active","release_date":"2025-05-20","model_type":"image","page_url":"https://fal.run/fal-ai/imagen4/preview","tagline":"Google’s highest quality image generation model","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-28","last_updated":"2026-05-11"},{"id":"fal-ai/imageutils/depth","name":"Midas Depth Estimation","created_by":"fal","source":"official","description":"Create depth maps using Midas depth estimation.","status":"active","release_date":"2024-02-13","model_type":"image","page_url":"https://fal.run/fal-ai/imageutils/depth","tagline":"Create depth maps using Midas depth estimation.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/imageutils/marigold-depth","name":"Marigold Depth Estimation","created_by":"fal","source":"official","description":"Create depth maps using Marigold depth estimation.","status":"active","release_date":"2023-12-28","model_type":"image","page_url":"https://fal.run/fal-ai/imageutils/marigold-depth","tagline":"Create depth maps using Marigold depth estimation.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/imageutils/nsfw","name":"NSFW Filter","created_by":"fal","source":"official","description":"Predict the probability of an image being NSFW.","status":"active","release_date":"2024-03-22","model_type":"other","page_url":"https://fal.run/fal-ai/imageutils/nsfw","tagline":"Predict the probability of an image being NSFW.","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/imageutils/rembg","name":"Remove Background","created_by":"fal","source":"official","description":"Remove the background from an 
image.","status":"active","release_date":"2023-10-05","model_type":"image","page_url":"https://fal.run/fal-ai/imageutils/rembg","tagline":"Remove the background from an image.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/index-tts-2/text-to-speech","name":"Index TTS 2.0","created_by":"fal","source":"official","description":"Generate natural, clear speeches using Index TTS 2.0 from IndexTeam","status":"active","release_date":"2025-10-07","model_type":"tts","page_url":"https://fal.run/fal-ai/index-tts-2/text-to-speech","tagline":"Generate natural, clear speeches using Index TTS 2.0 from IndexTeam","modalities":{"input":["text"],"output":["audio"]},"endpoints":["audio_speech"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/infinitalk/single-text","name":"Infinitalk","created_by":"fal","source":"official","description":"Infinitalk model generates a talking avatar video from a text and audio file.","status":"active","release_date":"2025-08-22","model_type":"video","page_url":"https://fal.run/fal-ai/infinitalk/single-text","tagline":"Infinitalk model generates a talking avatar video from a text and audio file.","modalities":{"input":["text","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/infinitalk/video-to-video","name":"Infinitalk","created_by":"fal","source":"official","description":"Infinitalk model generates a talking avatar video from an image and audio file.","status":"active","release_date":"2025-09-22","model_type":"other","page_url":"https://fal.run/fal-ai/infinitalk/video-to-video","tagline":"Infinitalk model generates a talking avatar video from an image and audio 
file.","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/infinitalk","name":"Infinitalk","created_by":"fal","source":"official","description":"Infinitalk model generates a talking avatar video from an image and audio file.","status":"active","release_date":"2025-08-21","model_type":"other","page_url":"https://fal.run/fal-ai/infinitalk","tagline":"Infinitalk model generates a talking avatar video from an image and audio file.","capabilities":{"vision":true},"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/infinity-star/text-to-video","name":"Infinity Star","created_by":"fal","source":"official","description":"InfinityStar’s unified 8B spacetime autoregressive engine to turn any text prompt into crisp 720p videos - 10× faster than diffusion models.","status":"active","release_date":"2025-11-07","model_type":"video","page_url":"https://fal.run/fal-ai/infinity-star/text-to-video","tagline":"InfinityStar’s unified 8B spacetime autoregressive engine to turn any text prompt into crisp 720p videos - 10× faster than diffusion models.","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/inpaint","name":"Inpainting sdxl and sd","created_by":"fal","source":"official","description":"Inpaint images with SD and SDXL","status":"active","release_date":"2023-11-04","model_type":"image","page_url":"https://fal.run/fal-ai/inpaint","tagline":"Inpaint images with SD and SDXL","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/instant-character","name":"Instant Character","created_by":"fal","source":"official","description":"InstantCharacter creates high-quality, consistent characters from text prompts, supporting diverse poses, styles, and appearances with strong identity 
control.","status":"active","release_date":"2025-04-18","model_type":"image","page_url":"https://fal.run/fal-ai/instant-character","tagline":"InstantCharacter creates high-quality, consistent characters from text prompts, supporting diverse poses, styles, and appearances with strong identity control.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/invisible-watermark","name":"Invisible Watermark","created_by":"fal","source":"official","description":"Invisible Watermark is a model that can add an invisible watermark to an image.","status":"active","release_date":"2025-03-14","model_type":"image","page_url":"https://fal.run/fal-ai/invisible-watermark","tagline":"Invisible Watermark is a model that can add an invisible watermark to an image.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/inworld-tts","name":"Inworld TTS-1.5 Max","created_by":"fal","source":"official","description":"Text to Speech Endpoint for Inworld's TTS-1.5 Max.","status":"active","release_date":"2026-03-13","model_type":"tts","page_url":"https://fal.run/fal-ai/inworld-tts","tagline":"Text to Speech Endpoint for Inworld's TTS-1.5 Max.","modalities":{"input":["text"],"output":["audio"]},"endpoints":["audio_speech"],"last_seen_at":"2026-05-07","last_updated":"2026-05-11"},{"id":"fal-ai/ip-adapter-face-id","name":"IP Adapter Face ID","created_by":"fal","source":"official","description":"High quality zero-shot personalization","status":"active","release_date":"2024-04-22","model_type":"image","page_url":"https://fal.run/fal-ai/ip-adapter-face-id","tagline":"High quality zero-shot 
personalization","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/janus","name":"DeepSeek Janus-Pro","created_by":"fal","source":"official","description":"DeepSeek Janus-Pro is a novel text-to-image model that unifies multimodal understanding and generation through an autoregressive framework","status":"active","release_date":"2025-01-28","model_type":"image","page_url":"https://fal.run/fal-ai/janus","tagline":"DeepSeek Janus-Pro is a novel text-to-image model that unifies multimodal understanding and generation through an autoregressive framework","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/joyai-image-edit","name":"Joyai Image Edit","created_by":"fal","source":"official","description":"All-in-one image AI with JoyAI-Image.","status":"active","release_date":"2026-04-06","model_type":"image","page_url":"https://fal.run/fal-ai/joyai-image-edit","tagline":"All-in-one image AI with JoyAI-Image.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-05-07","last_updated":"2026-05-11"},{"id":"fal-ai/kandinsky5-pro/image-to-video","name":"Kandinsky5 Pro","created_by":"fal","source":"official","description":"Kandinsky 5.0 Pro is a diffusion model for fast, high-quality image-to-video generation.","status":"active","release_date":"2025-12-23","model_type":"video","page_url":"https://fal.run/fal-ai/kandinsky5-pro/image-to-video","tagline":"Kandinsky 5.0 Pro is a diffusion model for fast, high-quality image-to-video 
generation.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/kandinsky5-pro/text-to-video","name":"Kandinsky5 Pro","created_by":"fal","source":"official","description":"Kandinsky 5.0 Pro is a diffusion model for fast, high-quality text-to-video generation.","status":"active","release_date":"2025-12-23","model_type":"video","page_url":"https://fal.run/fal-ai/kandinsky5-pro/text-to-video","tagline":"Kandinsky 5.0 Pro is a diffusion model for fast, high-quality text-to-video generation.","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/kandinsky5/text-to-video/distill","name":"Kandinsky5","created_by":"fal","source":"official","description":"Kandinsky 5.0 Distilled is a lightweight diffusion model for fast, high-quality text-to-video generation.","status":"active","release_date":"2025-10-13","model_type":"video","page_url":"https://fal.run/fal-ai/kandinsky5/text-to-video/distill","tagline":"Kandinsky 5.0 Distilled is a lightweight diffusion model for fast, high-quality text-to-video generation.","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/kandinsky5/text-to-video","name":"Kandinsky5","created_by":"fal","source":"official","description":"Kandinsky 5.0 is a diffusion model for fast, high-quality text-to-video generation.","status":"active","release_date":"2025-10-13","model_type":"video","page_url":"https://fal.run/fal-ai/kandinsky5/text-to-video","tagline":"Kandinsky 5.0 is a diffusion model for fast, high-quality text-to-video generation.","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/kling-image/o1","name":"Kling O1 
Image","created_by":"fal","source":"official","description":"Perform precise image edits using strong reference control, transforming subjects, styles, and local details while preserving visual consistency.","status":"active","release_date":"2025-12-01","model_type":"image","page_url":"https://fal.run/fal-ai/kling-image/o1","tagline":"Perform precise image edits using strong reference control, transforming subjects, styles, and local details while preserving visual consistency.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/kling-image/o3/image-to-image","name":"Kling Image","created_by":"fal","source":"official","description":"Kling Omni 3: Top-tier image-to-image with flawless consistency.","status":"active","release_date":"2026-02-03","model_type":"image","page_url":"https://fal.run/fal-ai/kling-image/o3/image-to-image","tagline":"Kling Omni 3: Top-tier image-to-image with flawless consistency.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/kling-image/o3/text-to-image","name":"Kling Image","created_by":"fal","source":"official","description":"Kling Omni 3: Top-tier text-to-image with flawless consistency.","status":"active","release_date":"2026-02-03","model_type":"image","page_url":"https://fal.run/fal-ai/kling-image/o3/text-to-image","tagline":"Kling Omni 3: Top-tier text-to-image with flawless consistency.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/kling-image/v3/image-to-image","name":"Kling Image","created_by":"fal","source":"official","description":"Kling Image V3: Latest kling image 
model","status":"active","release_date":"2026-02-03","model_type":"image","page_url":"https://fal.run/fal-ai/kling-image/v3/image-to-image","tagline":"Kling Image V3: Latest kling image model","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/kling-image/v3/text-to-image","name":"Kling Image","created_by":"fal","source":"official","description":"Kling V3: Latest Kling Image model","status":"active","release_date":"2026-02-03","model_type":"image","page_url":"https://fal.run/fal-ai/kling-image/v3/text-to-image","tagline":"Kling V3: Latest Kling Image model","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/kling/v1-5/kolors-virtual-try-on","name":"Kling Kolors Virtual TryOn v1.5","created_by":"fal","source":"official","description":"Kling Kolors Virtual TryOn v1.5 is a high quality image based Try-On endpoint which can be used for commercial try on.","status":"active","release_date":"2025-01-23","model_type":"image","page_url":"https://fal.run/fal-ai/kling/v1-5/kolors-virtual-try-on","tagline":"Kling Kolors Virtual TryOn v1.5 is a high quality image based Try-On endpoint which can be used for commercial try on.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/kling-video/ai-avatar/v2/pro","name":"Kling AI Avatar v2 Pro","created_by":"fal","source":"official","description":"Kling AI Avatar v2 Pro: The premium endpoint for creating avatar videos with realistic humans, animals, cartoons, or stylized characters","status":"active","release_date":"2025-12-04","model_type":"video","page_url":"https://fal.run/fal-ai/kling-video/ai-avatar/v2/pro","tagline":"Kling AI Avatar v2 Pro: The 
premium endpoint for creating avatar videos with realistic humans, animals, cartoons, or stylized characters","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/kling-video/ai-avatar/v2/standard","name":"Kling AI Avatar v2 Standard","created_by":"fal","source":"official","description":"Kling AI Avatar v2 Standard: Endpoint for creating avatar videos with realistic humans, animals, cartoons, or stylized characters","status":"active","release_date":"2025-12-04","model_type":"video","page_url":"https://fal.run/fal-ai/kling-video/ai-avatar/v2/standard","tagline":"Kling AI Avatar v2 Standard: Endpoint for creating avatar videos with realistic humans, animals, cartoons, or stylized characters","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/kling-video/create-voice","name":"Kling Video Create Voice","created_by":"fal","source":"official","description":"Create Voices to be used with Kling Models Voice Control","status":"active","release_date":"2025-12-16","model_type":"other","page_url":"https://fal.run/fal-ai/kling-video/create-voice","tagline":"Create Voices to be used with Kling Models Voice Control","last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/kling-video/lipsync/audio-to-video","name":"Kling LipSync Audio-to-Video","created_by":"fal","source":"official","description":"Kling LipSync is an audio-to-video model that generates realistic lip movements from audio input.","status":"active","release_date":"2025-03-27","model_type":"video","page_url":"https://fal.run/fal-ai/kling-video/lipsync/audio-to-video","tagline":"Kling LipSync is an audio-to-video model that generates realistic lip movements from audio 
input.","modalities":{"input":["text","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/kling-video/lipsync/text-to-video","name":"Kling LipSync Text-to-Video","created_by":"fal","source":"official","description":"Kling LipSync is a text-to-video model that generates realistic lip movements from text input.","status":"active","release_date":"2025-03-27","model_type":"video","page_url":"https://fal.run/fal-ai/kling-video/lipsync/text-to-video","tagline":"Kling LipSync is a text-to-video model that generates realistic lip movements from text input.","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/kling-video/o1/image-to-video","name":"Kling O1 First Frame Last Frame to Video [Pro]","created_by":"fal","source":"official","description":"Generate a video by taking a start frame and an end frame, animating the transition between them while following text-driven style and scene guidance.","status":"active","release_date":"2025-12-01","model_type":"video","page_url":"https://fal.run/fal-ai/kling-video/o1/image-to-video","tagline":"Generate a video by taking a start frame and an end frame, animating the transition between them while following text-driven style and scene guidance.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/kling-video/o1/reference-to-video","name":"Kling O1 Reference Image to Video [Pro]","created_by":"fal","source":"official","description":"Transform images, elements, and text into consistent, high-quality video scenes, ensuring stable character identity, object details, and environments.","status":"active","release_date":"2025-12-01","model_type":"video","page_url":"https://fal.run/fal-ai/kling-video/o1/reference-to-video","tagline":"Transform images, 
elements, and text into consistent, high-quality video scenes, ensuring stable character identity, object details, and environments.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/kling-video/o1/standard/image-to-video","name":"Kling O1 First Frame Last Frame to Video [Standard]","created_by":"fal","source":"official","description":"Generate a video by taking a start frame and an end frame, animating the transition between them while following text-driven style and scene guidance.","status":"active","release_date":"2025-12-15","model_type":"video","page_url":"https://fal.run/fal-ai/kling-video/o1/standard/image-to-video","tagline":"Generate a video by taking a start frame and an end frame, animating the transition between them while following text-driven style and scene guidance.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/kling-video/o1/standard/reference-to-video","name":"Kling O1 Reference Image to Video [Standard]","created_by":"fal","source":"official","description":"Transform images, elements, and text into consistent, high-quality video scenes, ensuring stable character identity, object details, and environments.","status":"active","release_date":"2025-12-15","model_type":"video","page_url":"https://fal.run/fal-ai/kling-video/o1/standard/reference-to-video","tagline":"Transform images, elements, and text into consistent, high-quality video scenes, ensuring stable character identity, object details, and environments.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/kling-video/o1/standard/video-to-video/edit","name":"Kling O1 Edit Video 
[Standard]","created_by":"fal","source":"official","description":"Edit an existing video using natural-language instructions, transforming subjects, settings, and style while retaining the original motion structure.","status":"active","release_date":"2025-12-15","model_type":"other","page_url":"https://fal.run/fal-ai/kling-video/o1/standard/video-to-video/edit","tagline":"Edit an existing video using natural-language instructions, transforming subjects, settings, and style while retaining the original motion structure.","last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/kling-video/o1/standard/video-to-video/reference","name":"Kling O1 Reference Video to Video [Standard]","created_by":"fal","source":"official","description":"Kling O1 Omni generates new shots guided by an input reference video, preserving cinematic language such as motion, and camera style to produce seamless scene continuity.","status":"active","release_date":"2025-12-15","model_type":"other","page_url":"https://fal.run/fal-ai/kling-video/o1/standard/video-to-video/reference","tagline":"Kling O1 Omni generates new shots guided by an input reference video, preserving cinematic language such as motion, and camera style to produce seamless scene continuity.","last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/kling-video/o1/video-to-video/edit","name":"Kling O1 Edit Video [Pro]","created_by":"fal","source":"official","description":"Edit an existing video using natural-language instructions, transforming subjects, settings, and style while retaining the original motion structure.","status":"active","release_date":"2025-12-01","model_type":"other","page_url":"https://fal.run/fal-ai/kling-video/o1/video-to-video/edit","tagline":"Edit an existing video using natural-language instructions, transforming subjects, settings, and style while retaining the original motion 
structure.","last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/kling-video/o1/video-to-video/reference","name":"Kling O1 Reference Video to Video [Pro]","created_by":"fal","source":"official","description":"Kling O1 Omni generates new shots guided by an input reference video, preserving cinematic language such as motion, and camera style to produce seamless scene continuity.","status":"active","release_date":"2025-12-01","model_type":"other","page_url":"https://fal.run/fal-ai/kling-video/o1/video-to-video/reference","tagline":"Kling O1 Omni generates new shots guided by an input reference video, preserving cinematic language such as motion, and camera style to produce seamless scene continuity.","last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/kling-video/o3/4k/image-to-video","name":"Kling Video","created_by":"fal","source":"official","description":"Kling's Native 4K is a video generation model that directly outputs professional-grade 4K video in one step, eliminating the need for post-production upscaling","status":"active","release_date":"2026-04-22","model_type":"video","page_url":"https://fal.run/fal-ai/kling-video/o3/4k/image-to-video","tagline":"Kling's Native 4K is a video generation model that directly outputs professional-grade 4K video in one step, eliminating the need for post-production upscaling","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/kling-video/o3/4k/reference-to-video","name":"Kling Video","created_by":"fal","source":"official","description":"Kling's Native 4K is a video generation model that directly outputs professional-grade 4K video in one step, eliminating the need for post-production upscaling","status":"active","release_date":"2026-04-22","model_type":"video","page_url":"https://fal.run/fal-ai/kling-video/o3/4k/reference-to-video","tagline":"Kling's Native 4K 
is a video generation model that directly outputs professional-grade 4K video in one step, eliminating the need for post-production upscaling","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/kling-video/o3/4k/text-to-video","name":"Kling Video","created_by":"fal","source":"official","description":"Kling's Native 4K is a video generation model that directly outputs professional-grade 4K video in one step, eliminating the need for post-production upscaling","status":"active","release_date":"2026-04-22","model_type":"video","page_url":"https://fal.run/fal-ai/kling-video/o3/4k/text-to-video","tagline":"Kling's Native 4K is a video generation model that directly outputs professional-grade 4K video in one step, eliminating the need for post-production upscaling","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/kling-video/o3/pro/image-to-video","name":"Kling O3 Image to Video [Pro]","created_by":"fal","source":"official","description":"Generate a video by taking a start frame and an end frame, animating the transition between them while following text-driven style and scene guidance.","status":"active","release_date":"2026-02-04","model_type":"video","page_url":"https://fal.run/fal-ai/kling-video/o3/pro/image-to-video","tagline":"Generate a video by taking a start frame and an end frame, animating the transition between them while following text-driven style and scene guidance.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/kling-video/o3/pro/reference-to-video","name":"Kling O3 Reference to Video [Pro]","created_by":"fal","source":"official","description":"Transform images, elements, and text into consistent, 
high-quality video scenes, ensuring stable character identity, object details, and environments.","status":"active","release_date":"2026-02-04","model_type":"video","page_url":"https://fal.run/fal-ai/kling-video/o3/pro/reference-to-video","tagline":"Transform images, elements, and text into consistent, high-quality video scenes, ensuring stable character identity, object details, and environments.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/kling-video/o3/pro/text-to-video","name":"Kling O3 Text to Video [Pro]","created_by":"fal","source":"official","description":"Generate realistic videos using Kling O3 from Kling Team!","status":"active","release_date":"2026-02-04","model_type":"video","page_url":"https://fal.run/fal-ai/kling-video/o3/pro/text-to-video","tagline":"Generate realistic videos using Kling O3 from Kling Team!","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/kling-video/o3/pro/video-to-video/edit","name":"Kling O3 Edit Video [Pro]","created_by":"fal","source":"official","description":"Edit videos using Kling O3 from Kling Team!","status":"active","release_date":"2026-02-04","model_type":"other","page_url":"https://fal.run/fal-ai/kling-video/o3/pro/video-to-video/edit","tagline":"Edit videos using Kling O3 from Kling Team!","last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/kling-video/o3/pro/video-to-video/reference","name":"Kling O3 Reference Video to Video [Pro]","created_by":"fal","source":"official","description":"Kling O3 Omni generates new shots guided by an input reference video, preserving cinematic language such as motion, and camera style to produce seamless scene 
continuity.","status":"active","release_date":"2026-02-04","model_type":"other","page_url":"https://fal.run/fal-ai/kling-video/o3/pro/video-to-video/reference","tagline":"Kling O3 Omni generates new shots guided by an input reference video, preserving cinematic language such as motion, and camera style to produce seamless scene continuity.","last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/kling-video/o3/standard/image-to-video","name":"Kling O3 Image to Video [Pro]","created_by":"fal","source":"official","description":"Generate a video by taking a start frame and an end frame, animating the transition between them while following text-driven style and scene guidance.","status":"active","release_date":"2026-02-04","model_type":"video","page_url":"https://fal.run/fal-ai/kling-video/o3/standard/image-to-video","tagline":"Generate a video by taking a start frame and an end frame, animating the transition between them while following text-driven style and scene guidance.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/kling-video/o3/standard/reference-to-video","name":"Kling O3 Reference to Video [Standard]","created_by":"fal","source":"official","description":"Transform images, elements, and text into consistent, high-quality video scenes, ensuring stable character identity, object details, and environments.","status":"active","release_date":"2026-02-04","model_type":"video","page_url":"https://fal.run/fal-ai/kling-video/o3/standard/reference-to-video","tagline":"Transform images, elements, and text into consistent, high-quality video scenes, ensuring stable character identity, object details, and 
environments.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/kling-video/o3/standard/text-to-video","name":"Kling O3 Text to Video [Standard]","created_by":"fal","source":"official","description":"Generate realistic videos using Kling O3 from Kling Team!","status":"active","release_date":"2026-02-04","model_type":"video","page_url":"https://fal.run/fal-ai/kling-video/o3/standard/text-to-video","tagline":"Generate realistic videos using Kling O3 from Kling Team!","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/kling-video/o3/standard/video-to-video/edit","name":"Kling O3 Edit Video [Standard]","created_by":"fal","source":"official","description":"Edit videos using Kling O3 from Kling Team!","status":"active","release_date":"2026-02-04","model_type":"other","page_url":"https://fal.run/fal-ai/kling-video/o3/standard/video-to-video/edit","tagline":"Edit videos using Kling O3 from Kling Team!","last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/kling-video/o3/standard/video-to-video/reference","name":"Kling O3 Reference Video to Video [Standard]","created_by":"fal","source":"official","description":"Kling O3 Omni generates new shots guided by an input reference video, preserving cinematic language such as motion, and camera style to produce seamless scene continuity.","status":"active","release_date":"2026-02-04","model_type":"other","page_url":"https://fal.run/fal-ai/kling-video/o3/standard/video-to-video/reference","tagline":"Kling O3 Omni generates new shots guided by an input reference video, preserving cinematic language such as motion, and camera style to produce seamless scene continuity.","last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/kling-video/v1/pro/ai-avatar","name":"Kling AI Avatar 
Pro","created_by":"fal","source":"official","description":"Kling AI Avatar Pro: The premium endpoint for creating avatar videos with realistic humans, animals, cartoons, or stylized characters","status":"active","release_date":"2025-09-13","model_type":"video","page_url":"https://fal.run/fal-ai/kling-video/v1/pro/ai-avatar","tagline":"Kling AI Avatar Pro: The premium endpoint for creating avatar videos with realistic humans, animals, cartoons, or stylized characters","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/kling-video/v1/standard/ai-avatar","name":"Kling AI Avatar","created_by":"fal","source":"official","description":"Kling AI Avatar Standard: Endpoint for creating avatar videos with realistic humans, animals, cartoons, or stylized characters","status":"active","release_date":"2025-09-13","model_type":"video","page_url":"https://fal.run/fal-ai/kling-video/v1/standard/ai-avatar","tagline":"Kling AI Avatar Standard: Endpoint for creating avatar videos with realistic humans, animals, cartoons, or stylized characters","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/kling-video/v1/standard/effects","name":"Kling 1.0","created_by":"fal","source":"official","description":"Generate video clips from your prompts using Kling 1.0","status":"active","release_date":"2025-03-06","model_type":"video","page_url":"https://fal.run/fal-ai/kling-video/v1/standard/effects","tagline":"Generate video clips from your prompts using Kling 1.0","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/kling-video/v1/standard/image-to-video","name":"Kling 1.0","created_by":"fal","source":"official","description":"Generate video clips 
from your images using Kling 1.0","status":"active","release_date":"2024-10-04","model_type":"video","page_url":"https://fal.run/fal-ai/kling-video/v1/standard/image-to-video","tagline":"Generate video clips from your images using Kling 1.0","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/kling-video/v1/standard/text-to-video","name":"Kling 1.0","created_by":"fal","source":"official","description":"Generate video clips from your prompts using Kling 1.0","status":"active","release_date":"2024-12-03","model_type":"video","page_url":"https://fal.run/fal-ai/kling-video/v1/standard/text-to-video","tagline":"Generate video clips from your prompts using Kling 1.0","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/kling-video/v1/tts","name":"Kling TTS","created_by":"fal","source":"official","description":"Generate speech from text prompts and different voices using the Kling TTS model, which leverages advanced AI techniques to create high-quality text-to-speech.","status":"active","release_date":"2025-09-13","model_type":"tts","page_url":"https://fal.run/fal-ai/kling-video/v1/tts","tagline":"Generate speech from text prompts and different voices using the Kling TTS model, which leverages advanced AI techniques to create high-quality text-to-speech.","modalities":{"input":["text"],"output":["audio"]},"endpoints":["audio_speech"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/kling-video/v1.5/pro/effects","name":"Kling 1.5","created_by":"fal","source":"official","description":"Generate video clips from your prompts using Kling 1.5 (pro)","status":"active","release_date":"2025-03-06","model_type":"video","page_url":"https://fal.run/fal-ai/kling-video/v1.5/pro/effects","tagline":"Generate video clips from your prompts using 
Kling 1.5 (pro)","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/kling-video/v1.5/pro/image-to-video","name":"Kling 1.5","created_by":"fal","source":"official","description":"Generate video clips from your images using Kling 1.5 (pro)","status":"active","release_date":"2024-10-04","model_type":"video","page_url":"https://fal.run/fal-ai/kling-video/v1.5/pro/image-to-video","tagline":"Generate video clips from your images using Kling 1.5 (pro)","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/kling-video/v1.5/pro/text-to-video","name":"Kling 1.5","created_by":"fal","source":"official","description":"Generate video clips from your prompts using Kling 1.5 (pro)","status":"active","release_date":"2024-11-25","model_type":"video","page_url":"https://fal.run/fal-ai/kling-video/v1.5/pro/text-to-video","tagline":"Generate video clips from your prompts using Kling 1.5 (pro)","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/kling-video/v1.6/pro/effects","name":"Kling 1.6","created_by":"fal","source":"official","description":"Generate video clips from your prompts using Kling 1.6 (pro)","status":"active","release_date":"2025-03-06","model_type":"video","page_url":"https://fal.run/fal-ai/kling-video/v1.6/pro/effects","tagline":"Generate video clips from your prompts using Kling 1.6 (pro)","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/kling-video/v1.6/pro/elements","name":"Kling 1.6 Elements","created_by":"fal","source":"official","description":"Generate video clips from your multiple image references using Kling 1.6 
(pro)","status":"active","release_date":"2025-05-20","model_type":"video","page_url":"https://fal.run/fal-ai/kling-video/v1.6/pro/elements","tagline":"Generate video clips from your multiple image references using Kling 1.6 (pro)","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/kling-video/v1.6/pro/image-to-video","name":"Kling 1.6","created_by":"fal","source":"official","description":"Generate video clips from your images using Kling 1.6 (pro)","status":"active","release_date":"2025-01-07","model_type":"video","page_url":"https://fal.run/fal-ai/kling-video/v1.6/pro/image-to-video","tagline":"Generate video clips from your images using Kling 1.6 (pro)","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/kling-video/v1.6/pro/text-to-video","name":"Kling 1.6","created_by":"fal","source":"official","description":"Generate video clips from your prompts using Kling 1.6 (pro)","status":"active","release_date":"2025-02-27","model_type":"video","page_url":"https://fal.run/fal-ai/kling-video/v1.6/pro/text-to-video","tagline":"Generate video clips from your prompts using Kling 1.6 (pro)","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/kling-video/v1.6/standard/effects","name":"Kling 1.6","created_by":"fal","source":"official","description":"Generate video clips from your prompts using Kling 1.6 (std)","status":"active","release_date":"2025-03-06","model_type":"video","page_url":"https://fal.run/fal-ai/kling-video/v1.6/standard/effects","tagline":"Generate video clips from your prompts using Kling 1.6 
(std)","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/kling-video/v1.6/standard/elements","name":"Kling 1.6 Elements","created_by":"fal","source":"official","description":"Generate video clips from your multiple image references using Kling 1.6 (standard)","status":"active","release_date":"2025-05-20","model_type":"video","page_url":"https://fal.run/fal-ai/kling-video/v1.6/standard/elements","tagline":"Generate video clips from your multiple image references using Kling 1.6 (standard)","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/kling-video/v1.6/standard/image-to-video","name":"Kling 1.6","created_by":"fal","source":"official","description":"Generate video clips from your images using Kling 1.6 (std)","status":"active","release_date":"2025-01-07","model_type":"video","page_url":"https://fal.run/fal-ai/kling-video/v1.6/standard/image-to-video","tagline":"Generate video clips from your images using Kling 1.6 (std)","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/kling-video/v1.6/standard/text-to-video","name":"Kling 1.6","created_by":"fal","source":"official","description":"Generate video clips from your prompts using Kling 1.6 (std)","status":"active","release_date":"2025-01-07","model_type":"video","page_url":"https://fal.run/fal-ai/kling-video/v1.6/standard/text-to-video","tagline":"Generate video clips from your prompts using Kling 1.6 (std)","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-26","last_updated":"2026-06-29"},{"id":"fal-ai/kling-video/v2/master/image-to-video","name":"Kling 2.0 
Master","created_by":"fal","source":"official","description":"Generate video clips from your images using Kling 2.0 Master","status":"active","release_date":"2025-04-14","model_type":"video","page_url":"https://fal.run/fal-ai/kling-video/v2/master/image-to-video","tagline":"Generate video clips from your images using Kling 2.0 Master","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/kling-video/v2/master/text-to-video","name":"Kling 2.0 Master","created_by":"fal","source":"official","description":"Generate video clips from your prompts using Kling 2.0 Master","status":"active","release_date":"2025-04-14","model_type":"video","page_url":"https://fal.run/fal-ai/kling-video/v2/master/text-to-video","tagline":"Generate video clips from your prompts using Kling 2.0 Master","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/kling-video/v2.1/master/image-to-video","name":"Kling 2.1 Master","created_by":"fal","source":"official","description":"Kling 2.1 Master: The premium endpoint for Kling 2.1, designed for top-tier image-to-video generation with unparalleled motion fluidity, cinematic visuals, and exceptional prompt precision.","status":"active","release_date":"2025-05-29","model_type":"video","page_url":"https://fal.run/fal-ai/kling-video/v2.1/master/image-to-video","tagline":"Kling 2.1 Master: The premium endpoint for Kling 2.1, designed for top-tier image-to-video generation with unparalleled motion fluidity, cinematic visuals, and exceptional prompt precision.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/kling-video/v2.1/master/text-to-video","name":"Kling 2.1 
Master","created_by":"fal","source":"official","description":"Kling 2.1 Master: The premium endpoint for Kling 2.1, designed for top-tier text-to-video generation with unparalleled motion fluidity, cinematic visuals, and exceptional prompt precision.","status":"active","release_date":"2025-05-29","model_type":"video","page_url":"https://fal.run/fal-ai/kling-video/v2.1/master/text-to-video","tagline":"Kling 2.1 Master: The premium endpoint for Kling 2.1, designed for top-tier text-to-video generation with unparalleled motion fluidity, cinematic visuals, and exceptional prompt precision.","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/kling-video/v2.1/pro/image-to-video","name":"Kling 2.1 (pro)","created_by":"fal","source":"official","description":"Kling 2.1 Pro is an advanced endpoint for the Kling 2.1 model, offering professional-grade videos with enhanced visual fidelity, precise camera movements, and dynamic motion control, perfect for cinematic storytelling.","status":"active","release_date":"2025-05-28","model_type":"video","page_url":"https://fal.run/fal-ai/kling-video/v2.1/pro/image-to-video","tagline":"Kling 2.1 Pro is an advanced endpoint for the Kling 2.1 model, offering professional-grade videos with enhanced visual fidelity, precise camera movements, and dynamic motion control, perfect for cinem","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/kling-video/v2.1/standard/image-to-video","name":"Kling 2.1 (standard)","created_by":"fal","source":"official","description":"Kling 2.1 Standard is a cost-efficient endpoint for the Kling 2.1 model, delivering high-quality image-to-video generation 
\n\n","status":"active","release_date":"2025-05-28","model_type":"video","page_url":"https://fal.run/fal-ai/kling-video/v2.1/standard/image-to-video","tagline":"Kling 2.1 Standard is a cost-efficient endpoint for the Kling 2.1 model, delivering high-quality image-to-video generation \n\n","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/kling-video/v2.5-turbo/pro/image-to-video","name":"Kling Video","created_by":"fal","source":"official","description":"Kling 2.5 Turbo Pro: Top-tier image-to-video generation with unparalleled motion fluidity, cinematic visuals, and exceptional prompt precision.","status":"active","release_date":"2025-09-22","model_type":"video","page_url":"https://fal.run/fal-ai/kling-video/v2.5-turbo/pro/image-to-video","tagline":"Kling 2.5 Turbo Pro: Top-tier image-to-video generation with unparalleled motion fluidity, cinematic visuals, and exceptional prompt precision.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/kling-video/v2.5-turbo/pro/text-to-video","name":"Kling v2.5 Text to Video","created_by":"fal","source":"official","description":"Kling 2.5 Turbo Pro: Top-tier text-to-video generation with unparalleled motion fluidity, cinematic visuals, and exceptional prompt precision.","status":"active","release_date":"2025-09-22","model_type":"video","page_url":"https://fal.run/fal-ai/kling-video/v2.5-turbo/pro/text-to-video","tagline":"Kling 2.5 Turbo Pro: Top-tier text-to-video generation with unparalleled motion fluidity, cinematic visuals, and exceptional prompt precision.","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/kling-video/v2.5-turbo/standard/image-to-video","name":"Kling 
Video","created_by":"fal","source":"official","description":"Kling 2.5 Turbo Standard: Top-tier image-to-video generation with unparalleled motion fluidity, cinematic visuals, and exceptional prompt precision.","status":"active","release_date":"2025-10-22","model_type":"video","page_url":"https://fal.run/fal-ai/kling-video/v2.5-turbo/standard/image-to-video","tagline":"Kling 2.5 Turbo Standard: Top-tier image-to-video generation with unparalleled motion fluidity, cinematic visuals, and exceptional prompt precision.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/kling-video/v2.6/pro/image-to-video","name":"Kling Video v2.6 Image to Video","created_by":"fal","source":"official","description":"Kling 2.6 Pro: Top-tier image-to-video with cinematic visuals, fluid motion, and native audio generation.","status":"active","release_date":"2025-12-02","model_type":"video","page_url":"https://fal.run/fal-ai/kling-video/v2.6/pro/image-to-video","tagline":"Kling 2.6 Pro: Top-tier image-to-video with cinematic visuals, fluid motion, and native audio generation.","capabilities":{"vision":true},"modalities":{"input":["text","image","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/kling-video/v2.6/pro/motion-control","name":"Kling Video v2.6 Motion Control [Pro]","created_by":"fal","source":"official","description":"Transfer movements from a reference video to any character image.","status":"active","release_date":"2025-12-21","model_type":"other","page_url":"https://fal.run/fal-ai/kling-video/v2.6/pro/motion-control","tagline":"Transfer movements from a reference video to any character image.","capabilities":{"vision":true},"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/kling-video/v2.6/pro/text-to-video","name":"Kling Video v2.6 Text to 
Video","created_by":"fal","source":"official","description":"Kling 2.6 Pro: Top-tier text-to-video with cinematic visuals, fluid motion, and native audio generation.","status":"active","release_date":"2025-12-02","model_type":"video","page_url":"https://fal.run/fal-ai/kling-video/v2.6/pro/text-to-video","tagline":"Kling 2.6 Pro: Top-tier text-to-video with cinematic visuals, fluid motion, and native audio generation.","modalities":{"input":["text","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/kling-video/v2.6/standard/motion-control","name":"Kling Video v2.6 Motion Control [Standard]","created_by":"fal","source":"official","description":"Transfer movements from a reference video to any character image.","status":"active","release_date":"2025-12-21","model_type":"other","page_url":"https://fal.run/fal-ai/kling-video/v2.6/standard/motion-control","tagline":"Transfer movements from a reference video to any character image.","capabilities":{"vision":true},"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/kling-video/v3/4k/image-to-video","name":"Kling Video","created_by":"fal","source":"official","description":"Kling's Native 4K is a video generation model that directly outputs professional-grade 4K video in one step, eliminating the need for post-production upscaling","status":"active","release_date":"2026-04-22","model_type":"video","page_url":"https://fal.run/fal-ai/kling-video/v3/4k/image-to-video","tagline":"Kling's Native 4K is a video generation model that directly outputs professional-grade 4K video in one step, eliminating the need for post-production upscaling","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/kling-video/v3/4k/text-to-video","name":"Kling Video V3 Text to Video 
4K","created_by":"fal","source":"official","description":"Kling's Native 4K is a video generation model that directly outputs professional-grade 4K video in one step, eliminating the need for post-production upscaling","status":"active","release_date":"2026-04-22","model_type":"video","page_url":"https://fal.run/fal-ai/kling-video/v3/4k/text-to-video","tagline":"Kling's Native 4K is a video generation model that directly outputs professional-grade 4K video in one step, eliminating the need for post-production upscaling","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/kling-video/v3/pro/image-to-video","name":"Kling Video v3 Image to Video [Pro]","created_by":"fal","source":"official","description":"Kling 3.0 Pro: Top-tier image-to-video with cinematic visuals, fluid motion, and native audio generation, with custom element support.","status":"active","release_date":"2026-02-04","model_type":"video","page_url":"https://fal.run/fal-ai/kling-video/v3/pro/image-to-video","tagline":"Kling 3.0 Pro: Top-tier image-to-video with cinematic visuals, fluid motion, and native audio generation, with custom element support.","capabilities":{"vision":true},"modalities":{"input":["text","image","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-05-29","last_updated":"2026-06-03"},{"id":"fal-ai/kling-video/v3/pro/motion-control","name":"Kling Video","created_by":"fal","source":"official","description":"Transfer movements from a reference video to any character image.","status":"active","release_date":"2026-03-05","model_type":"other","page_url":"https://fal.run/fal-ai/kling-video/v3/pro/motion-control","tagline":"Transfer movements from a reference video to any character image.","capabilities":{"vision":true},"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/kling-video/v3/pro/text-to-video","name":"Kling Video v3 Text to Video 
[Pro]","created_by":"fal","source":"official","description":"Kling 3.0 Pro: Top-tier text-to-video with cinematic visuals, fluid motion, and native audio generation, with multi-shot support.","status":"active","release_date":"2026-02-04","model_type":"video","page_url":"https://fal.run/fal-ai/kling-video/v3/pro/text-to-video","tagline":"Kling 3.0 Pro: Top-tier text-to-video with cinematic visuals, fluid motion, and native audio generation, with multi-shot support.","modalities":{"input":["text","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/kling-video/v3/standard/image-to-video","name":"Kling Video v3 Image to Video [Standard]","created_by":"fal","source":"official","description":"Kling 3.0 Standard: Top-tier image-to-video with cinematic visuals, fluid motion, and native audio generation, with custom element support.","status":"active","release_date":"2026-02-04","model_type":"video","page_url":"https://fal.run/fal-ai/kling-video/v3/standard/image-to-video","tagline":"Kling 3.0 Standard: Top-tier image-to-video with cinematic visuals, fluid motion, and native audio generation, with custom element support.","capabilities":{"vision":true},"modalities":{"input":["text","image","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/kling-video/v3/standard/motion-control","name":"Kling Video","created_by":"fal","source":"official","description":"Transfer movements from a reference video to any character image.","status":"active","release_date":"2026-03-05","model_type":"other","page_url":"https://fal.run/fal-ai/kling-video/v3/standard/motion-control","tagline":"Transfer movements from a reference video to any character image.","capabilities":{"vision":true},"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/kling-video/v3/standard/text-to-video","name":"Kling Video v3 Text to Video 
[Standard]","created_by":"fal","source":"official","description":"Kling 3.0 Standard: Top-tier text-to-video with cinematic visuals, fluid motion, and native audio generation, with multi-shot support.","status":"active","release_date":"2026-02-04","model_type":"video","page_url":"https://fal.run/fal-ai/kling-video/v3/standard/text-to-video","tagline":"Kling 3.0 Standard: Top-tier text-to-video with cinematic visuals, fluid motion, and native audio generation, with multi-shot support.","modalities":{"input":["text","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/kling-video/v3/turbo/pro/image-to-video","name":"Kling Video V3 Turbo Pro Image to Video","created_by":"fal","source":"official","description":"Generate high quality 1080p videos from images using Kling's Turbo 3.0 model, with improved lipsync and multishot generation capabilities.","status":"active","release_date":"2026-06-16","model_type":"video","page_url":"https://fal.run/fal-ai/kling-video/v3/turbo/pro/image-to-video","tagline":"Generate high quality 1080p videos from images using Kling's Turbo 3.0 model, with improved lipsync and multishot generation capabilities.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/kling-video/v3/turbo/pro/text-to-video","name":"Kling Video V3 Turbo Pro Text to Video","created_by":"fal","source":"official","description":"Generate high quality 1080p videos using Kling's Turbo 3.0 model, with improved lipsync and multishot generation capabilities.","status":"active","release_date":"2026-06-16","model_type":"video","page_url":"https://fal.run/fal-ai/kling-video/v3/turbo/pro/text-to-video","tagline":"Generate high quality 1080p videos using Kling's Turbo 3.0 model, with improved lipsync and multishot generation 
capabilities.","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/kling-video/v3/turbo/standard/image-to-video","name":"Kling Video V3 Standard Turbo Image to Video","created_by":"fal","source":"official","description":"Kling 3.0 Turbo Standard animates a first and last frame reference image into 720P video with native audio, delivering quick, affordable image-driven motion for fast turnaround","status":"active","release_date":"2026-06-16","model_type":"video","page_url":"https://fal.run/fal-ai/kling-video/v3/turbo/standard/image-to-video","tagline":"Kling 3.0 Turbo Standard animates a first and last frame reference image into 720P video with native audio, delivering quick, affordable image-driven motion for fast turnaround","capabilities":{"vision":true},"modalities":{"input":["text","image","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/kling-video/v3/turbo/standard/text-to-video","name":"Kling Video V3 Standard Turbo Text to Video","created_by":"fal","source":"official","description":"Kling 3.0 Turbo Standard is a fast, cost-efficient video generation model that turns text prompts directly into 720P video with native audio, optimized for rapid iteration and high-volume production","status":"active","release_date":"2026-06-16","model_type":"video","page_url":"https://fal.run/fal-ai/kling-video/v3/turbo/standard/text-to-video","tagline":"Kling 3.0 Turbo Standard is a fast, cost-efficient video generation model that turns text prompts directly into 720P video with native audio, optimized for rapid iteration and high-volume production","modalities":{"input":["text","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/kling-video/video-to-audio","name":"Kling Video","created_by":"fal","source":"official","description":"Generate audio 
from input videos using Kling","status":"active","release_date":"2025-10-09","model_type":"other","page_url":"https://fal.run/fal-ai/kling-video/video-to-audio","tagline":"Generate audio from input videos using Kling","last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/kokoro/american-english","name":"Kokoro TTS","created_by":"fal","source":"official","description":"Kokoro is a lightweight text-to-speech model that delivers comparable quality to larger models while being significantly faster and more cost-efficient.","status":"active","release_date":"2025-02-14","model_type":"other","page_url":"https://fal.run/fal-ai/kokoro/american-english","tagline":"Kokoro is a lightweight text-to-speech model that delivers comparable quality to larger models while being significantly faster and more cost-efficient.","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/kokoro/brazilian-portuguese","name":"Kokoro TTS (Brazilian Portuguese)","created_by":"fal","source":"official","description":"A natural and expressive Brazilian Portuguese text-to-speech model optimized for clarity and fluency.","status":"active","release_date":"2025-02-14","model_type":"other","page_url":"https://fal.run/fal-ai/kokoro/brazilian-portuguese","tagline":"A natural and expressive Brazilian Portuguese text-to-speech model optimized for clarity and fluency.","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/kokoro/british-english","name":"Kokoro TTS (British English)","created_by":"fal","source":"official","description":"A high-quality British English text-to-speech model offering natural and expressive voice synthesis.","status":"active","release_date":"2025-02-14","model_type":"other","page_url":"https://fal.run/fal-ai/kokoro/british-english","tagline":"A high-quality British English text-to-speech model offering natural and expressive voice 
synthesis.","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/kokoro/french","name":"Kokoro TTS (French)","created_by":"fal","source":"official","description":"An expressive and natural French text-to-speech model for both European and Canadian French.","status":"active","release_date":"2025-02-14","model_type":"other","page_url":"https://fal.run/fal-ai/kokoro/french","tagline":"An expressive and natural French text-to-speech model for both European and Canadian French.","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/kokoro/hindi","name":"Kokoro TTS (Hindi)","created_by":"fal","source":"official","description":"A fast and expressive Hindi text-to-speech model with clear pronunciation and accurate intonation.","status":"active","release_date":"2025-02-14","model_type":"other","page_url":"https://fal.run/fal-ai/kokoro/hindi","tagline":"A fast and expressive Hindi text-to-speech model with clear pronunciation and accurate intonation.","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/kokoro/italian","name":"Kokoro TTS (Italian)","created_by":"fal","source":"official","description":"A high-quality Italian text-to-speech model delivering smooth and expressive speech synthesis.","status":"active","release_date":"2025-02-14","model_type":"other","page_url":"https://fal.run/fal-ai/kokoro/italian","tagline":"A high-quality Italian text-to-speech model delivering smooth and expressive speech synthesis.","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/kokoro/japanese","name":"Kokoro TTS (Japanese)","created_by":"fal","source":"official","description":"A fast and natural-sounding Japanese text-to-speech model optimized for smooth pronunciation.","status":"active","release_date":"2025-02-14","model_type":"other","page_url":"https://fal.run/fal-ai/kokoro/japanese","tagline":"A fast and natural-sounding Japanese text-to-speech model optimized for smooth 
pronunciation.","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/kokoro/mandarin-chinese","name":"Kokoro TTS (Mandarin Chinese)","created_by":"fal","source":"official","description":"A highly efficient Mandarin Chinese text-to-speech model that captures natural tones and prosody.","status":"active","release_date":"2025-02-14","model_type":"other","page_url":"https://fal.run/fal-ai/kokoro/mandarin-chinese","tagline":"A highly efficient Mandarin Chinese text-to-speech model that captures natural tones and prosody.","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/kokoro/spanish","name":"Kokoro TTS (Spanish)","created_by":"fal","source":"official","description":"A natural-sounding Spanish text-to-speech model optimized for Latin American and European Spanish.","status":"active","release_date":"2025-02-14","model_type":"other","page_url":"https://fal.run/fal-ai/kokoro/spanish","tagline":"A natural-sounding Spanish text-to-speech model optimized for Latin American and European Spanish.","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/kolors/image-to-image","name":"Kolors Image to Image","created_by":"fal","source":"official","description":"Photorealistic Image-to-Image","status":"active","release_date":"2024-11-19","model_type":"image","page_url":"https://fal.run/fal-ai/kolors/image-to-image","tagline":"Photorealistic Image-to-Image","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/kolors","name":"Kolors","created_by":"fal","source":"official","description":"Photorealistic Text-to-Image","status":"active","release_date":"2024-07-24","model_type":"image","page_url":"https://fal.run/fal-ai/kolors","tagline":"Photorealistic 
Text-to-Image","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/krea-2-trainer","name":"Krea 2 Trainer","created_by":"fal","source":"official","description":"Train a custom LoRA on your own images to teach Krea 2 a new subject, character, or style.","status":"active","release_date":"2026-06-19","model_type":"other","page_url":"https://fal.run/fal-ai/krea-2-trainer","tagline":"Train a custom LoRA on your own images to teach Krea 2 a new subject, character, or style.","capabilities":{"vision":true},"last_seen_at":"2026-06-25","last_updated":"2026-06-29"},{"id":"fal-ai/krea-2/turbo/lora","name":"Krea 2 Text to Image Turbo LoRA","created_by":"fal","source":"official","description":"Generate high-fidelity images from text with Krea 2 using a custom-trained LoRA.","status":"active","release_date":"2026-06-19","model_type":"image","page_url":"https://fal.run/fal-ai/krea-2/turbo/lora","tagline":"Generate high-fidelity images from text with Krea 2 using a custom-trained LoRA.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/krea-2/turbo","name":"Krea 2 Turbo","created_by":"fal","source":"official","description":"Generate high-fidelity images from text in seconds with Krea 2 Turbo, the speed-optimized open-source version of Krea 2, preserving its aesthetic range for rapid ideation.","status":"active","release_date":"2026-06-18","model_type":"image","page_url":"https://fal.run/fal-ai/krea-2/turbo","tagline":"Generate high-fidelity images from text in seconds with Krea 2 Turbo, the speed-optimized open-source version of Krea 2, preserving its aesthetic range for rapid 
ideation.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/krea-wan-14b/text-to-video","name":"Krea Wan 14b- Text to Video","created_by":"fal","source":"official","description":"Fast Text-to-Video endpoint for Krea's Wan 14b model.","status":"active","release_date":"2025-10-20","model_type":"video","page_url":"https://fal.run/fal-ai/krea-wan-14b/text-to-video","tagline":"Fast Text-to-Video endpoint for Krea's Wan 14b model.","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/krea-wan-14b/video-to-video","name":"Krea Wan 14B","created_by":"fal","source":"official","description":"Superfast video model based on Wan 2.1 14b by Krea, excelling at real-time video-editing.","status":"active","release_date":"2025-10-14","model_type":"other","page_url":"https://fal.run/fal-ai/krea-wan-14b/video-to-video","tagline":"Superfast video model based on Wan 2.1 14b by Krea, excelling at real-time video-editing.","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/latentsync","name":"LatentSync","created_by":"fal","source":"official","description":"LatentSync is a video-to-video model that generates lip sync animations from audio using advanced algorithms for high-quality synchronization.","status":"active","release_date":"2025-03-25","model_type":"other","page_url":"https://fal.run/fal-ai/latentsync","tagline":"LatentSync is a video-to-video model that generates lip sync animations from audio using advanced algorithms for high-quality synchronization.","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/lava-sr","name":"Lava SR","created_by":"fal","source":"official","description":"Enhance muffled 16 kHz speech audio into crystal-clear 48 kHz, with denoising for particularly bad 
inputs.","status":"active","release_date":"2026-02-23","model_type":"other","page_url":"https://fal.run/fal-ai/lava-sr","tagline":"Enhance muffled 16 kHz speech audio into crystal-clear 48 kHz, with denoising for particularly bad inputs.","last_seen_at":"2026-02-23","last_updated":"2026-05-11"},{"id":"fal-ai/layer-diffusion","name":"Layer Diffusion XL","created_by":"fal","source":"official","description":"SDXL with an alpha channel.","status":"active","release_date":"2024-04-13","model_type":"image","page_url":"https://fal.run/fal-ai/layer-diffusion","tagline":"SDXL with an alpha channel.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/lcm-sd15-i2i","name":"Optimized Latent Consistency (SDv1.5)","created_by":"fal","source":"official","description":"Produce high-quality images with minimal inference steps.","status":"active","release_date":"2023-11-09","model_type":"image","page_url":"https://fal.run/fal-ai/lcm-sd15-i2i","tagline":"Produce high-quality images with minimal inference steps.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/lcm","name":"Latent Consistency (SDXL & SDv1.5)","created_by":"fal","source":"official","description":"Produce high-quality images with minimal inference steps.","status":"active","release_date":"2024-02-04","model_type":"image","page_url":"https://fal.run/fal-ai/lcm","tagline":"Produce high-quality images with minimal inference steps.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/leffa/pose-transfer","name":"Leffa Pose Transfer","created_by":"fal","source":"official","description":"Leffa Pose Transfer is an endpoint for changing pose of an 
image with a reference image.","status":"active","release_date":"2024-12-17","model_type":"image","page_url":"https://fal.run/fal-ai/leffa/pose-transfer","tagline":"Leffa Pose Transfer is an endpoint for changing pose of an image with a reference image.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/leffa/virtual-tryon","name":"Leffa Virtual TryOn","created_by":"fal","source":"official","description":"Leffa Virtual TryOn is a high quality image based Try-On endpoint which can be used for commercial try on.","status":"active","release_date":"2024-12-17","model_type":"image","page_url":"https://fal.run/fal-ai/leffa/virtual-tryon","tagline":"Leffa Virtual TryOn is a high quality image based Try-On endpoint which can be used for commercial try on.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/lightning-models","name":"Lightning Models","created_by":"fal","source":"official","description":"Collection of SDXL Lightning models.","status":"active","release_date":"2024-04-25","model_type":"image","page_url":"https://fal.run/fal-ai/lightning-models","tagline":"Collection of SDXL Lightning models.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/lightx/recamera","name":"Lightx","created_by":"fal","source":"official","description":"Use the capabilities of lightx to relight and recamera your videos.","status":"active","release_date":"2025-12-22","model_type":"other","page_url":"https://fal.run/fal-ai/lightx/recamera","tagline":"Use the capabilities of lightx to relight and recamera your 
videos.","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/lightx/relight","name":"Lightx","created_by":"fal","source":"official","description":"Use tlightx capabilities to relight and recamera your videos.","status":"active","release_date":"2025-12-22","model_type":"other","page_url":"https://fal.run/fal-ai/lightx/relight","tagline":"Use tlightx capabilities to relight and recamera your videos.","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/live-portrait/image","name":"Live Portrait","created_by":"fal","source":"official","description":"Transfer expression from a video to a portrait.","status":"active","release_date":"2024-10-01","model_type":"image","page_url":"https://fal.run/fal-ai/live-portrait/image","tagline":"Transfer expression from a video to a portrait.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/live-portrait","name":"Live Portrait","created_by":"fal","source":"official","description":"Transfer expression from a video to a portrait.","status":"active","release_date":"2024-07-09","model_type":"video","page_url":"https://fal.run/fal-ai/live-portrait","tagline":"Transfer expression from a video to a portrait.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/llava-next","name":"LLaVA v1.6 34B","created_by":"fal","source":"official","description":"Vision","status":"active","release_date":"2024-02-14","model_type":"other","page_url":"https://fal.run/fal-ai/llava-next","tagline":"Vision","capabilities":{"vision":true},"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/longcat-image/edit","name":"Longcat Image","created_by":"fal","source":"official","description":"LongCat image Edit is a 6B parameter image editing model 
excelling at multilingual text rendering, photorealism and deployment efficiency.","status":"active","release_date":"2025-12-05","model_type":"image","page_url":"https://fal.run/fal-ai/longcat-image/edit","tagline":"LongCat image Edit is a 6B parameter image editing model excelling at multilingual text rendering, photorealism and deployment efficiency.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/longcat-image","name":"Longcat Image","created_by":"fal","source":"official","description":"LongCat image is a 6B parameter model excelling at multilingual text rendering, photorealism and deployment efficiency.","status":"active","release_date":"2025-12-05","model_type":"image","page_url":"https://fal.run/fal-ai/longcat-image","tagline":"LongCat image is a 6B parameter model excelling at multilingual text rendering, photorealism and deployment efficiency.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/longcat-multi-avatar/image-audio-to-video/multi-speaker","name":"Longcat Multi Avatar","created_by":"fal","source":"official","description":"LongCat-Video-Avatar is an audio-driven video generation model that can generates super-realistic, lip-synchronized long video generation with natural dynamics and consistent identity.","status":"active","release_date":"2025-12-30","model_type":"other","page_url":"https://fal.run/fal-ai/longcat-multi-avatar/image-audio-to-video/multi-speaker","tagline":"LongCat-Video-Avatar is an audio-driven video generation model that can generates super-realistic, lip-synchronized long video generation with natural dynamics and consistent 
identity.","capabilities":{"vision":true},"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/longcat-multi-avatar/image-audio-to-video","name":"Longcat Multi Avatar","created_by":"fal","source":"official","description":"LongCat-Video-Avatar is an audio-driven video generation model that can generates super-realistic, lip-synchronized long video generation with natural dynamics and consistent identity.","status":"active","release_date":"2026-01-08","model_type":"other","page_url":"https://fal.run/fal-ai/longcat-multi-avatar/image-audio-to-video","tagline":"LongCat-Video-Avatar is an audio-driven video generation model that can generates super-realistic, lip-synchronized long video generation with natural dynamics and consistent identity.","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/longcat-single-avatar/audio-to-video","name":"Longcat Single Avatar","created_by":"fal","source":"official","description":"LongCat-Video-Avatar is an audio-driven video generation model that can generates super-realistic, lip-synchronized long video generation with natural dynamics and consistent identity.","status":"active","release_date":"2025-12-30","model_type":"other","page_url":"https://fal.run/fal-ai/longcat-single-avatar/audio-to-video","tagline":"LongCat-Video-Avatar is an audio-driven video generation model that can generates super-realistic, lip-synchronized long video generation with natural dynamics and consistent identity.","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/longcat-single-avatar/image-audio-to-video","name":"Longcat Single Avatar","created_by":"fal","source":"official","description":"LongCat-Video-Avatar is an audio-driven video generation model that can generates super-realistic, lip-synchronized long video generation with natural dynamics and consistent 
identity.","status":"active","release_date":"2025-12-30","model_type":"other","page_url":"https://fal.run/fal-ai/longcat-single-avatar/image-audio-to-video","tagline":"LongCat-Video-Avatar is an audio-driven video generation model that can generates super-realistic, lip-synchronized long video generation with natural dynamics and consistent identity.","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/longcat-video/distilled/image-to-video/480p","name":"LongCat Video Distilled","created_by":"fal","source":"official","description":"Generate long videos from images using LongCat Video Distilled","status":"active","release_date":"2025-10-29","model_type":"video","page_url":"https://fal.run/fal-ai/longcat-video/distilled/image-to-video/480p","tagline":"Generate long videos from images using LongCat Video Distilled","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/longcat-video/distilled/image-to-video/720p","name":"LongCat Video Distilled","created_by":"fal","source":"official","description":"Generate long videos in 720p/30fps from images using LongCat Video Distilled","status":"active","release_date":"2025-10-30","model_type":"video","page_url":"https://fal.run/fal-ai/longcat-video/distilled/image-to-video/720p","tagline":"Generate long videos in 720p/30fps from images using LongCat Video Distilled","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/longcat-video/distilled/text-to-video/480p","name":"LongCat Video Distilled","created_by":"fal","source":"official","description":"Generate long videos from text using LongCat Video 
Distilled","status":"active","release_date":"2025-10-28","model_type":"video","page_url":"https://fal.run/fal-ai/longcat-video/distilled/text-to-video/480p","tagline":"Generate long videos from text using LongCat Video Distilled","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/longcat-video/distilled/text-to-video/720p","name":"LongCat Video Distilled","created_by":"fal","source":"official","description":"Generate long videos in 720p/30fps from text using LongCat Video Distilled","status":"active","release_date":"2025-10-30","model_type":"video","page_url":"https://fal.run/fal-ai/longcat-video/distilled/text-to-video/720p","tagline":"Generate long videos in 720p/30fps from text using LongCat Video Distilled","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/longcat-video/image-to-video/480p","name":"LongCat Video","created_by":"fal","source":"official","description":"Generate long videos from images using LongCat Video","status":"active","release_date":"2025-10-30","model_type":"video","page_url":"https://fal.run/fal-ai/longcat-video/image-to-video/480p","tagline":"Generate long videos from images using LongCat Video","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/longcat-video/image-to-video/720p","name":"LongCat Video","created_by":"fal","source":"official","description":"Generate long videos in 720p/30fps from images using LongCat Video","status":"active","release_date":"2025-10-30","model_type":"video","page_url":"https://fal.run/fal-ai/longcat-video/image-to-video/720p","tagline":"Generate long videos in 720p/30fps from images using LongCat 
Video","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/longcat-video/text-to-video/480p","name":"LongCat Video","created_by":"fal","source":"official","description":"Generate long videos from text using LongCat Video","status":"active","release_date":"2025-10-30","model_type":"video","page_url":"https://fal.run/fal-ai/longcat-video/text-to-video/480p","tagline":"Generate long videos from text using LongCat Video","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/longcat-video/text-to-video/720p","name":"LongCat Video","created_by":"fal","source":"official","description":"Generate long videos in 720p/30fps from text using LongCat Video","status":"active","release_date":"2025-10-30","model_type":"video","page_url":"https://fal.run/fal-ai/longcat-video/text-to-video/720p","tagline":"Generate long videos in 720p/30fps from text using LongCat Video","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/lora/image-to-image","name":"Stable Diffusion with LoRAs","created_by":"fal","source":"official","description":"Run Any Stable Diffusion model with customizable LoRA weights.","status":"active","release_date":"2024-04-17","model_type":"image","page_url":"https://fal.run/fal-ai/lora/image-to-image","tagline":"Run Any Stable Diffusion model with customizable LoRA weights.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/lora/inpaint","name":"Stable Diffusion with LoRAs","created_by":"fal","source":"official","description":"Run Any Stable Diffusion model with customizable LoRA 
weights.","status":"active","release_date":"2024-04-18","model_type":"image","page_url":"https://fal.run/fal-ai/lora/inpaint","tagline":"Run Any Stable Diffusion model with customizable LoRA weights.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/lora","name":"Stable Diffusion with LoRAs","created_by":"fal","source":"official","description":"Run Any Stable Diffusion model with customizable LoRA weights.","status":"active","release_date":"2023-09-26","model_type":"image","page_url":"https://fal.run/fal-ai/lora","tagline":"Run Any Stable Diffusion model with customizable LoRA weights.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/ltx-2-19b/audio-to-video/lora","name":"LTX-2 19B","created_by":"fal","source":"official","description":"Generate video with audio from audio, text and images using LTX-2 and custom LoRA","status":"active","release_date":"2026-01-27","model_type":"other","page_url":"https://fal.run/fal-ai/ltx-2-19b/audio-to-video/lora","tagline":"Generate video with audio from audio, text and images using LTX-2 and custom LoRA","capabilities":{"vision":true},"last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2-19b/audio-to-video","name":"LTX-2 19B","created_by":"fal","source":"official","description":"Generate video with audio from audio, text and images using LTX-2","status":"active","release_date":"2026-01-27","model_type":"other","page_url":"https://fal.run/fal-ai/ltx-2-19b/audio-to-video","tagline":"Generate video with audio from audio, text and images using LTX-2","capabilities":{"vision":true},"last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2-19b/distilled/audio-to-video/lora","name":"LTX-2 19B 
Distilled","created_by":"fal","source":"official","description":"Generate video with audio from audio, text and images using LTX-2 Distilled and custom LoRA","status":"active","release_date":"2026-01-27","model_type":"other","page_url":"https://fal.run/fal-ai/ltx-2-19b/distilled/audio-to-video/lora","tagline":"Generate video with audio from audio, text and images using LTX-2 Distilled and custom LoRA","capabilities":{"vision":true},"last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2-19b/distilled/audio-to-video","name":"LTX-2 19B Distilled","created_by":"fal","source":"official","description":"Generate video with audio from audio, text and images using LTX-2 Distilled","status":"active","release_date":"2026-01-27","model_type":"other","page_url":"https://fal.run/fal-ai/ltx-2-19b/distilled/audio-to-video","tagline":"Generate video with audio from audio, text and images using LTX-2 Distilled","capabilities":{"vision":true},"last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2-19b/distilled/extend-video/lora","name":"LTX-2 19B Distilled","created_by":"fal","source":"official","description":"Extend videos with audio using LTX-2 Distilled and custom LoRA","status":"active","release_date":"2026-01-05","model_type":"other","page_url":"https://fal.run/fal-ai/ltx-2-19b/distilled/extend-video/lora","tagline":"Extend videos with audio using LTX-2 Distilled and custom LoRA","last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2-19b/distilled/extend-video","name":"LTX-2 19B Distilled","created_by":"fal","source":"official","description":"Extend videos with audio using LTX-2 Distilled","status":"active","release_date":"2026-01-05","model_type":"other","page_url":"https://fal.run/fal-ai/ltx-2-19b/distilled/extend-video","tagline":"Extend videos with audio using LTX-2 Distilled","last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2-19b/distilled/image-to-video/lora","name":"LTX-2 19B 
Distilled","created_by":"fal","source":"official","description":"Generate video with audio from images using LTX-2 Distilled and custom LoRA","status":"active","release_date":"2026-01-05","model_type":"video","page_url":"https://fal.run/fal-ai/ltx-2-19b/distilled/image-to-video/lora","tagline":"Generate video with audio from images using LTX-2 Distilled and custom LoRA","capabilities":{"vision":true},"modalities":{"input":["text","image","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2-19b/distilled/image-to-video","name":"LTX-2 19B Distilled","created_by":"fal","source":"official","description":"Generate video with audio from images using LTX-2 Distilled","status":"active","release_date":"2026-01-05","model_type":"video","page_url":"https://fal.run/fal-ai/ltx-2-19b/distilled/image-to-video","tagline":"Generate video with audio from images using LTX-2 Distilled","capabilities":{"vision":true},"modalities":{"input":["text","image","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2-19b/distilled/text-to-video/lora","name":"LTX-2 19B Distilled","created_by":"fal","source":"official","description":"Generate video with audio from text using LTX-2 Distilled and custom LoRA","status":"active","release_date":"2026-01-05","model_type":"video","page_url":"https://fal.run/fal-ai/ltx-2-19b/distilled/text-to-video/lora","tagline":"Generate video with audio from text using LTX-2 Distilled and custom LoRA","modalities":{"input":["text","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2-19b/distilled/text-to-video","name":"LTX-2 19B Distilled","created_by":"fal","source":"official","description":"Generate video with audio from text using LTX-2 
Distilled","status":"active","release_date":"2026-01-05","model_type":"video","page_url":"https://fal.run/fal-ai/ltx-2-19b/distilled/text-to-video","tagline":"Generate video with audio from text using LTX-2 Distilled","modalities":{"input":["text","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2-19b/distilled/video-to-video/lora","name":"LTX-2 19B Distilled","created_by":"fal","source":"official","description":"Generate video with audio from videos using LTX-2 Distilled and custom LoRA","status":"active","release_date":"2026-01-07","model_type":"other","page_url":"https://fal.run/fal-ai/ltx-2-19b/distilled/video-to-video/lora","tagline":"Generate video with audio from videos using LTX-2 Distilled and custom LoRA","last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2-19b/distilled/video-to-video","name":"LTX-2 19B Distilled","created_by":"fal","source":"official","description":"Generate video with audio from videos using LTX-2 Distilled","status":"active","release_date":"2026-01-07","model_type":"other","page_url":"https://fal.run/fal-ai/ltx-2-19b/distilled/video-to-video","tagline":"Generate video with audio from videos using LTX-2 Distilled","last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2-19b/extend-video/lora","name":"LTX-2 19B","created_by":"fal","source":"official","description":"Extend video with audio using LTX-2 and custom LoRA","status":"active","release_date":"2026-01-05","model_type":"other","page_url":"https://fal.run/fal-ai/ltx-2-19b/extend-video/lora","tagline":"Extend video with audio using LTX-2 and custom LoRA","last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2-19b/extend-video","name":"LTX-2 19B","created_by":"fal","source":"official","description":"Extend video with audio using 
LTX-2","status":"active","release_date":"2026-01-05","model_type":"other","page_url":"https://fal.run/fal-ai/ltx-2-19b/extend-video","tagline":"Extend video with audio using LTX-2","last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2-19b/image-to-video/lora","name":"LTX-2 19B","created_by":"fal","source":"official","description":"Generate video with audio from images using LTX-2 and custom LoRA","status":"active","release_date":"2026-01-05","model_type":"video","page_url":"https://fal.run/fal-ai/ltx-2-19b/image-to-video/lora","tagline":"Generate video with audio from images using LTX-2 and custom LoRA","capabilities":{"vision":true},"modalities":{"input":["text","image","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2-19b/image-to-video","name":"LTX-2 19B","created_by":"fal","source":"official","description":"Generate video with audio from images using LTX-2","status":"active","release_date":"2026-01-05","model_type":"video","page_url":"https://fal.run/fal-ai/ltx-2-19b/image-to-video","tagline":"Generate video with audio from images using LTX-2","capabilities":{"vision":true},"modalities":{"input":["text","image","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2-19b/text-to-video/lora","name":"LTX-2 19B","created_by":"fal","source":"official","description":"Generate video with audio from text using LTX-2 and custom LoRA","status":"active","release_date":"2026-01-05","model_type":"video","page_url":"https://fal.run/fal-ai/ltx-2-19b/text-to-video/lora","tagline":"Generate video with audio from text using LTX-2 and custom LoRA","modalities":{"input":["text","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2-19b/text-to-video","name":"LTX-2 19B","created_by":"fal","source":"official","description":"Generate video 
with audio from text using LTX-2","status":"active","release_date":"2026-01-05","model_type":"video","page_url":"https://fal.run/fal-ai/ltx-2-19b/text-to-video","tagline":"Generate video with audio from text using LTX-2","modalities":{"input":["text","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2-19b/video-to-video/lora","name":"LTX-2 19B","created_by":"fal","source":"official","description":"Generate video with audio from videos using LTX-2 and custom LoRA","status":"active","release_date":"2026-01-07","model_type":"other","page_url":"https://fal.run/fal-ai/ltx-2-19b/video-to-video/lora","tagline":"Generate video with audio from videos using LTX-2 and custom LoRA","last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2-19b/video-to-video","name":"LTX-2 19B","created_by":"fal","source":"official","description":"Generate video with audio from videos using LTX-2","status":"active","release_date":"2026-01-07","model_type":"other","page_url":"https://fal.run/fal-ai/ltx-2-19b/video-to-video","tagline":"Generate video with audio from videos using LTX-2","last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2/audio-to-video","name":"LTX 2.0 Video Pro","created_by":"fal","source":"official","description":"Generate video from audio using LTX-2","status":"active","release_date":"2026-03-04","model_type":"other","page_url":"https://fal.run/fal-ai/ltx-2/audio-to-video","tagline":"Generate video from audio using LTX-2","last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2/extend-video","name":"LTX Video 2.0 Pro","created_by":"fal","source":"official","description":"Extends videos with audio using LTX-2","status":"active","release_date":"2026-03-04","model_type":"other","page_url":"https://fal.run/fal-ai/ltx-2/extend-video","tagline":"Extends videos with audio using 
LTX-2","last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2/image-to-video/fast","name":"LTX Video 2.0 Fast","created_by":"fal","source":"official","description":"Create high-fidelity video with audio from images with LTX-2 Fast","status":"active","release_date":"2025-11-26","model_type":"video","page_url":"https://fal.run/fal-ai/ltx-2/image-to-video/fast","tagline":"Create high-fidelity video with audio from images with LTX-2 Fast","capabilities":{"vision":true},"modalities":{"input":["text","image","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2/image-to-video","name":"LTX Video 2.0 Pro","created_by":"fal","source":"official","description":"Create high-fidelity video with audio from images with LTX-2 Pro","status":"active","release_date":"2025-11-26","model_type":"video","page_url":"https://fal.run/fal-ai/ltx-2/image-to-video","tagline":"Create high-fidelity video with audio from images with LTX-2 Pro","capabilities":{"vision":true},"modalities":{"input":["text","image","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2/retake-video","name":"LTX Video 2.0 Retake","created_by":"fal","source":"official","description":"Change sections of a video using LTX-2","status":"active","release_date":"2025-11-26","model_type":"other","page_url":"https://fal.run/fal-ai/ltx-2/retake-video","tagline":"Change sections of a video using LTX-2","last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2/text-to-video/fast","name":"LTX Video 2.0 Fast","created_by":"fal","source":"official","description":"Create high-fidelity video with audio from text with LTX-2 Fast","status":"active","release_date":"2025-11-26","model_type":"video","page_url":"https://fal.run/fal-ai/ltx-2/text-to-video/fast","tagline":"Create high-fidelity video with audio from text with LTX-2 
Fast","modalities":{"input":["text","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2/text-to-video","name":"LTX Video 2.0 Pro","created_by":"fal","source":"official","description":"Create high-fidelity video with audio from text with LTX-2 Pro.","status":"active","release_date":"2025-11-26","model_type":"video","page_url":"https://fal.run/fal-ai/ltx-2/text-to-video","tagline":"Create high-fidelity video with audio from text with LTX-2 Pro.","modalities":{"input":["text","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2.3-22b/audio-to-video/lora","name":"LTX-2.3 22B","created_by":"fal","source":"official","description":"Generate video with audio from audio, text and images using LTX-2.3 and custom LoRA","status":"active","release_date":"2026-03-14","model_type":"other","page_url":"https://fal.run/fal-ai/ltx-2.3-22b/audio-to-video/lora","tagline":"Generate video with audio from audio, text and images using LTX-2.3 and custom LoRA","capabilities":{"vision":true},"last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2.3-22b/audio-to-video","name":"LTX-2.3 22B","created_by":"fal","source":"official","description":"Generate video with audio from audio, text and images using LTX-2","status":"active","release_date":"2026-03-14","model_type":"other","page_url":"https://fal.run/fal-ai/ltx-2.3-22b/audio-to-video","tagline":"Generate video with audio from audio, text and images using LTX-2","capabilities":{"vision":true},"last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2.3-22b/distilled/audio-to-video/lora","name":"LTX-2.3 22B Distilled","created_by":"fal","source":"official","description":"Generate video with audio from audio, text and images using LTX-2.3 Distilled and custom 
LoRA","status":"active","release_date":"2026-03-14","model_type":"other","page_url":"https://fal.run/fal-ai/ltx-2.3-22b/distilled/audio-to-video/lora","tagline":"Generate video with audio from audio, text and images using LTX-2.3 Distilled and custom LoRA","capabilities":{"vision":true},"last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2.3-22b/distilled/audio-to-video","name":"LTX-2.3 22B Distilled","created_by":"fal","source":"official","description":"Generate video with audio from audio, text and images using LTX-2 Distilled","status":"active","release_date":"2026-03-14","model_type":"other","page_url":"https://fal.run/fal-ai/ltx-2.3-22b/distilled/audio-to-video","tagline":"Generate video with audio from audio, text and images using LTX-2 Distilled","capabilities":{"vision":true},"last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2.3-22b/distilled/image-to-video/lora","name":"LTX-2.3 22B Distilled","created_by":"fal","source":"official","description":"Generate video with audio from images using LTX-2.3 Distilled and custom LoRA","status":"active","release_date":"2026-03-14","model_type":"video","page_url":"https://fal.run/fal-ai/ltx-2.3-22b/distilled/image-to-video/lora","tagline":"Generate video with audio from images using LTX-2.3 Distilled and custom LoRA","capabilities":{"vision":true},"modalities":{"input":["text","image","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2.3-22b/distilled/image-to-video","name":"LTX-2.3 22B Distilled","created_by":"fal","source":"official","description":"Generate video with audio from images using LTX-2.3 Distilled","status":"active","release_date":"2026-03-14","model_type":"video","page_url":"https://fal.run/fal-ai/ltx-2.3-22b/distilled/image-to-video","tagline":"Generate video with audio from images using LTX-2.3 
Distilled","capabilities":{"vision":true},"modalities":{"input":["text","image","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2.3-22b/distilled/reference-video-to-video/lora","name":"LTX-2.3 22B Distilled","created_by":"fal","source":"official","description":"Generate video with audio from reference videos using LTX-2.3 Distilled and custom LoRA","status":"active","release_date":"2026-04-14","model_type":"other","page_url":"https://fal.run/fal-ai/ltx-2.3-22b/distilled/reference-video-to-video/lora","tagline":"Generate video with audio from reference videos using LTX-2.3 Distilled and custom LoRA","last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2.3-22b/distilled/reference-video-to-video","name":"LTX-2.3 22B Distilled","created_by":"fal","source":"official","description":"Generate video with audio from reference videos using LTX-2.3 Distilled","status":"active","release_date":"2026-04-14","model_type":"other","page_url":"https://fal.run/fal-ai/ltx-2.3-22b/distilled/reference-video-to-video","tagline":"Generate video with audio from reference videos using LTX-2.3 Distilled","last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2.3-22b/distilled/text-to-video/lora","name":"LTX-2.3 22B Distilled","created_by":"fal","source":"official","description":"Generate video with audio from text using LTX-2.3 Distilled and custom LoRA","status":"active","release_date":"2026-03-14","model_type":"video","page_url":"https://fal.run/fal-ai/ltx-2.3-22b/distilled/text-to-video/lora","tagline":"Generate video with audio from text using LTX-2.3 Distilled and custom LoRA","modalities":{"input":["text","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2.3-22b/distilled/text-to-video","name":"LTX-2.3 22B Distilled","created_by":"fal","source":"official","description":"Generate video with 
audio from text using LTX-2.3 Distilled","status":"active","release_date":"2026-03-14","model_type":"video","page_url":"https://fal.run/fal-ai/ltx-2.3-22b/distilled/text-to-video","tagline":"Generate video with audio from text using LTX-2.3 Distilled","modalities":{"input":["text","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2.3-22b/distilled/video-to-video/lora","name":"LTX-2.3 22B Distilled","created_by":"fal","source":"official","description":"Generate video with audio from videos using LTX-2.3 Distilled and custom LoRA","status":"active","release_date":"2026-03-14","model_type":"other","page_url":"https://fal.run/fal-ai/ltx-2.3-22b/distilled/video-to-video/lora","tagline":"Generate video with audio from videos using LTX-2.3 Distilled and custom LoRA","last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2.3-22b/distilled/video-to-video","name":"LTX-2.3 22B Distilled","created_by":"fal","source":"official","description":"Generate video with audio from videos using LTX-2.3 Distilled","status":"active","release_date":"2026-03-14","model_type":"other","page_url":"https://fal.run/fal-ai/ltx-2.3-22b/distilled/video-to-video","tagline":"Generate video with audio from videos using LTX-2.3 Distilled","last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2.3-22b/extend-video/lora","name":"LTX-2.3 22B","created_by":"fal","source":"official","description":"Extend video with audio using LTX-2.3 and custom LoRA","status":"active","release_date":"2026-03-14","model_type":"other","page_url":"https://fal.run/fal-ai/ltx-2.3-22b/extend-video/lora","tagline":"Extend video with audio using LTX-2.3 and custom LoRA","last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2.3-22b/extend-video","name":"LTX-2.3 22B","created_by":"fal","source":"official","description":"Extend video with audio using 
LTX-2.3","status":"active","release_date":"2026-03-14","model_type":"other","page_url":"https://fal.run/fal-ai/ltx-2.3-22b/extend-video","tagline":"Extend video with audio using LTX-2.3","last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2.3-22b/image-to-video/lora","name":"LTX-2.3 22B","created_by":"fal","source":"official","description":"Generate video with audio from images using LTX-2.3 and custom LoRA","status":"active","release_date":"2026-03-14","model_type":"video","page_url":"https://fal.run/fal-ai/ltx-2.3-22b/image-to-video/lora","tagline":"Generate video with audio from images using LTX-2.3 and custom LoRA","capabilities":{"vision":true},"modalities":{"input":["text","image","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2.3-22b/image-to-video","name":"LTX-2.3 22B","created_by":"fal","source":"official","description":"Generate video with audio from images using LTX-2.3","status":"active","release_date":"2026-03-14","model_type":"video","page_url":"https://fal.run/fal-ai/ltx-2.3-22b/image-to-video","tagline":"Generate video with audio from images using LTX-2.3","capabilities":{"vision":true},"modalities":{"input":["text","image","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2.3-22b/reference-video-to-video/lora","name":"LTX 2.3 22B","created_by":"fal","source":"official","description":"Generate video with audio from reference video, text and images using LTX-2.3 and custom LoRA","status":"active","release_date":"2026-04-14","model_type":"other","page_url":"https://fal.run/fal-ai/ltx-2.3-22b/reference-video-to-video/lora","tagline":"Generate video with audio from reference video, text and images using LTX-2.3 and custom 
LoRA","capabilities":{"vision":true},"last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2.3-22b/reference-video-to-video","name":"LTX-2.3 22B","created_by":"fal","source":"official","description":"Generate video with audio from reference video, text and images using LTX-2.3","status":"active","release_date":"2026-04-14","model_type":"other","page_url":"https://fal.run/fal-ai/ltx-2.3-22b/reference-video-to-video","tagline":"Generate video with audio from reference video, text and images using LTX-2.3","capabilities":{"vision":true},"last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2.3-22b/text-to-video/lora","name":"LTX-2.3 22B","created_by":"fal","source":"official","description":"Generate video with audio from text using LTX-2.3 and custom LoRA","status":"active","release_date":"2026-03-14","model_type":"video","page_url":"https://fal.run/fal-ai/ltx-2.3-22b/text-to-video/lora","tagline":"Generate video with audio from text using LTX-2.3 and custom LoRA","modalities":{"input":["text","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2.3-22b/text-to-video","name":"LTX-2.3 22B","created_by":"fal","source":"official","description":"Generate video with audio from text using LTX-2.3","status":"active","release_date":"2026-03-14","model_type":"video","page_url":"https://fal.run/fal-ai/ltx-2.3-22b/text-to-video","tagline":"Generate video with audio from text using LTX-2.3","modalities":{"input":["text","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2.3-22b/video-to-video/lora","name":"LTX-2.3 22B","created_by":"fal","source":"official","description":"Generate video with audio from videos using LTX-2.3 and custom LoRA","status":"active","release_date":"2026-03-14","model_type":"other","page_url":"https://fal.run/fal-ai/ltx-2.3-22b/video-to-video/lora","tagline":"Generate 
video with audio from videos using LTX-2.3 and custom LoRA","last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2.3-22b/video-to-video","name":"LTX-2.3 22B","created_by":"fal","source":"official","description":"Generate video with audio from videos using LTX-2.3","status":"active","release_date":"2026-03-14","model_type":"other","page_url":"https://fal.run/fal-ai/ltx-2.3-22b/video-to-video","tagline":"Generate video with audio from videos using LTX-2.3","last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2.3/audio-to-video","name":"LTX 2.3 Video Pro","created_by":"fal","source":"official","description":"LTX-2.3 is a high-quality, fast AI video model available in Pro and Fast variants for text-to-video, image-to-video, and audio-to-video.","status":"active","release_date":"2026-03-05","model_type":"other","page_url":"https://fal.run/fal-ai/ltx-2.3/audio-to-video","tagline":"LTX-2.3 is a high-quality, fast AI video model available in Pro and Fast variants for text-to-video, image-to-video, and audio-to-video.","capabilities":{"vision":true},"last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2.3/extend-video","name":"LTX Video 2.3 Pro","created_by":"fal","source":"official","description":"LTX-2.3 is a high-quality, fast AI video model available in Pro and Fast variants for text-to-video, image-to-video, and audio-to-video.","status":"active","release_date":"2026-03-05","model_type":"other","page_url":"https://fal.run/fal-ai/ltx-2.3/extend-video","tagline":"LTX-2.3 is a high-quality, fast AI video model available in Pro and Fast variants for text-to-video, image-to-video, and audio-to-video.","capabilities":{"vision":true},"last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2.3/image-to-video/fast","name":"LTX 2.3 Video Fast","created_by":"fal","source":"official","description":"LTX-2.3 is a high-quality, fast AI video model available in Pro and Fast variants for text-to-video, 
image-to-video, and audio-to-video.","status":"active","release_date":"2026-03-05","model_type":"video","page_url":"https://fal.run/fal-ai/ltx-2.3/image-to-video/fast","tagline":"LTX-2.3 is a high-quality, fast AI video model available in Pro and Fast variants for text-to-video, image-to-video, and audio-to-video.","capabilities":{"vision":true},"modalities":{"input":["text","image","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2.3/image-to-video","name":"LTX 2.3 Video Pro","created_by":"fal","source":"official","description":"LTX-2.3 is a high-quality, fast AI video model available in Pro and Fast variants for text-to-video, image-to-video, and audio-to-video.","status":"active","release_date":"2026-03-05","model_type":"video","page_url":"https://fal.run/fal-ai/ltx-2.3/image-to-video","tagline":"LTX-2.3 is a high-quality, fast AI video model available in Pro and Fast variants for text-to-video, image-to-video, and audio-to-video.","capabilities":{"vision":true},"modalities":{"input":["text","image","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2.3-quality/audio-to-video/lora","name":"Ltx 2.3 Quality","created_by":"fal","source":"official","description":"Generate high-quality video with audio from audio, text and images using LTX-2.3 and custom LoRA","status":"active","release_date":"2026-06-01","model_type":"other","page_url":"https://fal.run/fal-ai/ltx-2.3-quality/audio-to-video/lora","tagline":"Generate high-quality video with audio from audio, text and images using LTX-2.3 and custom LoRA","capabilities":{"vision":true},"last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2.3-quality/audio-to-video","name":"Ltx 2.3 Quality","created_by":"fal","source":"official","description":"Generate high-quality video with audio from audio, text and images using 
LTX-2","status":"active","release_date":"2026-06-01","model_type":"other","page_url":"https://fal.run/fal-ai/ltx-2.3-quality/audio-to-video","tagline":"Generate high-quality video with audio from audio, text and images using LTX-2","capabilities":{"vision":true},"last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2.3-quality/colorization","name":"Ltx 2.3 Quality","created_by":"fal","source":"official","description":"Colorize high-quality video using LTX-2.3","status":"active","release_date":"2026-06-24","model_type":"other","page_url":"https://fal.run/fal-ai/ltx-2.3-quality/colorization","tagline":"Colorize high-quality video using LTX-2.3","last_seen_at":"2026-06-25","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2.3-quality/cross-eyed","name":"Ltx 2.3 Quality","created_by":"fal","source":"official","description":"Cross-eyes for high-quality video using LTX-2.3","status":"active","release_date":"2026-06-25","model_type":"other","page_url":"https://fal.run/fal-ai/ltx-2.3-quality/cross-eyed","tagline":"Cross-eyes for high-quality video using LTX-2.3","last_seen_at":"2026-06-25","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2.3-quality/day-to-night","name":"Ltx 2.3 Quality","created_by":"fal","source":"official","description":"Day to Night for high-quality video using LTX-2.3","status":"active","release_date":"2026-06-25","model_type":"other","page_url":"https://fal.run/fal-ai/ltx-2.3-quality/day-to-night","tagline":"Day to Night for high-quality video using LTX-2.3","last_seen_at":"2026-06-25","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2.3-quality/deblur","name":"Ltx 2.3 Quality","created_by":"fal","source":"official","description":"Deblur high-quality video using LTX-2.3\n","status":"active","release_date":"2026-06-24","model_type":"other","page_url":"https://fal.run/fal-ai/ltx-2.3-quality/deblur","tagline":"Deblur high-quality video using 
LTX-2.3\n","last_seen_at":"2026-06-25","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2.3-quality/decompression","name":"Ltx 2.3 Quality","created_by":"fal","source":"official","description":"Decompression / Denoise high-quality video using LTX-2.3","status":"active","release_date":"2026-06-25","model_type":"other","page_url":"https://fal.run/fal-ai/ltx-2.3-quality/decompression","tagline":"Decompression / Denoise high-quality video using LTX-2.3","last_seen_at":"2026-06-25","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2.3-quality/hdr/lora","name":"Ltx 2.3 Quality","created_by":"fal","source":"official","description":"Generate HDR from reference video using LTX-2.3 with lora","status":"active","release_date":"2026-06-01","model_type":"other","page_url":"https://fal.run/fal-ai/ltx-2.3-quality/hdr/lora","tagline":"Generate HDR from reference video using LTX-2.3 with lora","last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2.3-quality/hdr","name":"Ltx 2.3 Quality","created_by":"fal","source":"official","description":"Generate HDR from reference video using LTX-2.3 ","status":"active","release_date":"2026-06-01","model_type":"other","page_url":"https://fal.run/fal-ai/ltx-2.3-quality/hdr","tagline":"Generate HDR from reference video using LTX-2.3 ","last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2.3-quality/image-to-video/lora","name":"Ltx 2.3 Quality","created_by":"fal","source":"official","description":"Generate high-quality video with audio from images using LTX-2.3 and custom LoRA","status":"active","release_date":"2026-06-01","model_type":"video","page_url":"https://fal.run/fal-ai/ltx-2.3-quality/image-to-video/lora","tagline":"Generate high-quality video with audio from images using LTX-2.3 and custom 
LoRA","capabilities":{"vision":true},"modalities":{"input":["text","image","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2.3-quality/image-to-video","name":"Ltx 2.3 Quality","created_by":"fal","source":"official","description":"Generate high-quality video with audio from images using LTX-2.3","status":"active","release_date":"2026-06-01","model_type":"video","page_url":"https://fal.run/fal-ai/ltx-2.3-quality/image-to-video","tagline":"Generate high-quality video with audio from images using LTX-2.3","capabilities":{"vision":true},"modalities":{"input":["text","image","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2.3-quality/ingredient","name":"Ltx 2.3 Quality","created_by":"fal","source":"official","description":"Generate high-quality video with audio from reference, character sheet, storyboard using LTX-2.3","status":"active","release_date":"2026-06-18","model_type":"video","page_url":"https://fal.run/fal-ai/ltx-2.3-quality/ingredient","tagline":"Generate high-quality video with audio from reference, character sheet, storyboard using LTX-2.3","capabilities":{"vision":true},"modalities":{"input":["text","image","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2.3-quality/inpaint/lora","name":"Ltx 2.3 Quality","created_by":"fal","source":"official","description":"Inpaint high-quality video using LTX-2.3 with lora","status":"active","release_date":"2026-06-18","model_type":"other","page_url":"https://fal.run/fal-ai/ltx-2.3-quality/inpaint/lora","tagline":"Inpaint high-quality video using LTX-2.3 with lora","last_seen_at":"2026-06-18","last_updated":"2026-06-18"},{"id":"fal-ai/ltx-2.3-quality/inpaint","name":"Ltx 2.3 Quality","created_by":"fal","source":"official","description":"Inpaint high-quality video using LTX-2.3 
","status":"active","release_date":"2026-06-18","model_type":"other","page_url":"https://fal.run/fal-ai/ltx-2.3-quality/inpaint","tagline":"Inpaint high-quality video using LTX-2.3 ","last_seen_at":"2026-06-18","last_updated":"2026-06-18"},{"id":"fal-ai/ltx-2.3-quality/instant-shave","name":"Ltx 2.3 Quality","created_by":"fal","source":"official","description":"Instant shave high-quality video using LTX-2.3","status":"active","release_date":"2026-06-25","model_type":"other","page_url":"https://fal.run/fal-ai/ltx-2.3-quality/instant-shave","tagline":"Instant shave high-quality video using LTX-2.3","last_seen_at":"2026-06-25","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2.3-quality/outpaint/lora","name":"Ltx 2.3 Quality","created_by":"fal","source":"official","description":"Outpaint high-quality video using LTX-2.3 with Lora","status":"active","release_date":"2026-06-17","model_type":"other","page_url":"https://fal.run/fal-ai/ltx-2.3-quality/outpaint/lora","tagline":"Outpaint high-quality video using LTX-2.3 with Lora","last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2.3-quality/outpaint","name":"Ltx 2.3 Quality","created_by":"fal","source":"official","description":"Outpaint high-quality video using LTX-2.3 ","status":"active","release_date":"2026-06-17","model_type":"other","page_url":"https://fal.run/fal-ai/ltx-2.3-quality/outpaint","tagline":"Outpaint high-quality video using LTX-2.3 ","last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2.3-quality/reference-video-to-video/lora","name":"Ltx 2.3 Quality","created_by":"fal","source":"official","description":"Generate high-quality video with audio from reference video, text and images using LTX-2.3 and custom LoRA","status":"active","release_date":"2026-06-01","model_type":"other","page_url":"https://fal.run/fal-ai/ltx-2.3-quality/reference-video-to-video/lora","tagline":"Generate high-quality video with audio from reference video, text and images using LTX-2.3 and 
custom LoRA","capabilities":{"vision":true},"last_seen_at":"2026-06-25","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2.3-quality/reference-video-to-video","name":"Ltx 2.3 Quality","created_by":"fal","source":"official","description":"Generate high-quality video with audio from reference video, text and images using LTX-2.3","status":"active","release_date":"2026-06-01","model_type":"other","page_url":"https://fal.run/fal-ai/ltx-2.3-quality/reference-video-to-video","tagline":"Generate high-quality video with audio from reference video, text and images using LTX-2.3","capabilities":{"vision":true},"last_seen_at":"2026-06-25","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2.3-quality/render-to-real","name":"Ltx 2.3 Quality","created_by":"fal","source":"official","description":"Transform your 3D video render into realistic using first frame with Ltx 2.3","status":"active","release_date":"2026-06-26","model_type":"other","page_url":"https://fal.run/fal-ai/ltx-2.3-quality/render-to-real","tagline":"Transform your 3D video render into realistic using first frame with Ltx 2.3","last_seen_at":"2026-06-26","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2.3-quality/text-to-audio/lora","name":"Ltx 2.3 Quality","created_by":"fal","source":"official","description":"Text to Audio high-quality using LTX-2.3 with Lora","status":"active","release_date":"2026-06-17","model_type":"other","page_url":"https://fal.run/fal-ai/ltx-2.3-quality/text-to-audio/lora","tagline":"Text to Audio high-quality using LTX-2.3 with Lora","last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2.3-quality/text-to-audio","name":"Ltx 2.3 Quality","created_by":"fal","source":"official","description":"Text to Audio high-quality using LTX-2.3 ","status":"active","release_date":"2026-06-17","model_type":"other","page_url":"https://fal.run/fal-ai/ltx-2.3-quality/text-to-audio","tagline":"Text to Audio high-quality using LTX-2.3 
","last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2.3-quality/text-to-video/lora","name":"Ltx 2.3 Quality","created_by":"fal","source":"official","description":"Generate high-quality video with audio from text using LTX-2.3 and custom LoRA","status":"active","release_date":"2026-06-01","model_type":"video","page_url":"https://fal.run/fal-ai/ltx-2.3-quality/text-to-video/lora","tagline":"Generate high-quality video with audio from text using LTX-2.3 and custom LoRA","modalities":{"input":["text","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2.3-quality/text-to-video","name":"Ltx 2.3 Quality","created_by":"fal","source":"official","description":"Generate high-quality video with audio from text using LTX-2.3","status":"active","release_date":"2026-06-01","model_type":"video","page_url":"https://fal.run/fal-ai/ltx-2.3-quality/text-to-video","tagline":"Generate high-quality video with audio from text using LTX-2.3","modalities":{"input":["text","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2.3-quality/water-simulation","name":"Ltx 2.3 Quality","created_by":"fal","source":"official","description":"Water Simulation transformation for high-quality video using LTX-2.3","status":"active","release_date":"2026-06-25","model_type":"other","page_url":"https://fal.run/fal-ai/ltx-2.3-quality/water-simulation","tagline":"Water Simulation transformation for high-quality video using LTX-2.3","last_seen_at":"2026-06-25","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2.3/retake-video","name":"LTX Video 2.3 Pro","created_by":"fal","source":"official","description":"LTX-2.3 is a high-quality, fast AI video model available in Pro and Fast variants for text-to-video, image-to-video, and 
audio-to-video.","status":"active","release_date":"2026-03-05","model_type":"other","page_url":"https://fal.run/fal-ai/ltx-2.3/retake-video","tagline":"LTX-2.3 is a high-quality, fast AI video model available in Pro and Fast variants for text-to-video, image-to-video, and audio-to-video.","capabilities":{"vision":true},"last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2.3/text-to-video/fast","name":"LTX 2.3 Video Fast","created_by":"fal","source":"official","description":"LTX-2.3 is a high-quality, fast AI video model available in Pro and Fast variants for text-to-video, image-to-video, and audio-to-video.","status":"active","release_date":"2026-03-05","model_type":"video","page_url":"https://fal.run/fal-ai/ltx-2.3/text-to-video/fast","tagline":"LTX-2.3 is a high-quality, fast AI video model available in Pro and Fast variants for text-to-video, image-to-video, and audio-to-video.","capabilities":{"vision":true},"modalities":{"input":["text","image","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2.3/text-to-video","name":"LTX Video 2.3 Pro","created_by":"fal","source":"official","description":"LTX-2.3 is a high-quality, fast AI video model available in Pro and Fast variants for text-to-video, image-to-video, and audio-to-video.","status":"active","release_date":"2026-03-05","model_type":"video","page_url":"https://fal.run/fal-ai/ltx-2.3/text-to-video","tagline":"LTX-2.3 is a high-quality, fast AI video model available in Pro and Fast variants for text-to-video, image-to-video, and audio-to-video.","capabilities":{"vision":true},"modalities":{"input":["text","image","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-video-13b-dev/extend","name":"LTX Video-0.9.7 13B","created_by":"fal","source":"official","description":"Extend videos using LTX Video-0.9.7 13B and custom 
LoRA","status":"active","release_date":"2025-05-17","model_type":"other","parameters":13,"page_url":"https://fal.run/fal-ai/ltx-video-13b-dev/extend","tagline":"Extend videos using LTX Video-0.9.7 13B and custom LoRA","last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/ltx-video-13b-dev/image-to-video","name":"LTX Video-0.9.7 13B","created_by":"fal","source":"official","description":"Generate videos from prompts and images using LTX Video-0.9.7 13B and custom LoRA","status":"active","release_date":"2025-05-17","model_type":"video","parameters":13,"page_url":"https://fal.run/fal-ai/ltx-video-13b-dev/image-to-video","tagline":"Generate videos from prompts and images using LTX Video-0.9.7 13B and custom LoRA","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/ltx-video-13b-dev/multiconditioning","name":"LTX Video-0.9.7 13B","created_by":"fal","source":"official","description":"Generate videos from prompts, images, and videos using LTX Video-0.9.7 13B and custom LoRA","status":"active","release_date":"2025-05-17","model_type":"other","parameters":13,"page_url":"https://fal.run/fal-ai/ltx-video-13b-dev/multiconditioning","tagline":"Generate videos from prompts, images, and videos using LTX Video-0.9.7 13B and custom LoRA","capabilities":{"vision":true},"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/ltx-video-13b-dev","name":"LTX Video-0.9.7 13B","created_by":"fal","source":"official","description":"Generate videos from prompts using LTX Video-0.9.7 13B and custom LoRA","status":"active","release_date":"2025-05-17","model_type":"video","parameters":13,"page_url":"https://fal.run/fal-ai/ltx-video-13b-dev","tagline":"Generate videos from prompts using LTX Video-0.9.7 13B and custom 
LoRA","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/ltx-video-13b-distilled/extend","name":"LTX Video-0.9.7 13B Distilled","created_by":"fal","source":"official","description":"Extend videos using LTX Video-0.9.7 13B Distilled and custom LoRA","status":"active","release_date":"2025-05-17","model_type":"other","parameters":13,"page_url":"https://fal.run/fal-ai/ltx-video-13b-distilled/extend","tagline":"Extend videos using LTX Video-0.9.7 13B Distilled and custom LoRA","last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-video-13b-distilled/image-to-video","name":"LTX Video-0.9.7 13B Distilled","created_by":"fal","source":"official","description":"Generate videos from prompts and images using LTX Video-0.9.7 13B Distilled and custom LoRA","status":"active","release_date":"2025-05-17","model_type":"video","parameters":13,"page_url":"https://fal.run/fal-ai/ltx-video-13b-distilled/image-to-video","tagline":"Generate videos from prompts and images using LTX Video-0.9.7 13B Distilled and custom LoRA","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-video-13b-distilled/multiconditioning","name":"LTX Video-0.9.7 13B Distilled","created_by":"fal","source":"official","description":"Generate videos from prompts, images, and videos using LTX Video-0.9.7 13B Distilled and custom LoRA","status":"active","release_date":"2025-05-17","model_type":"other","parameters":13,"page_url":"https://fal.run/fal-ai/ltx-video-13b-distilled/multiconditioning","tagline":"Generate videos from prompts, images, and videos using LTX Video-0.9.7 13B Distilled and custom LoRA","capabilities":{"vision":true},"last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-video-13b-distilled","name":"LTX Video-0.9.7 13B 
Distilled","created_by":"fal","source":"official","description":"Generate videos from prompts using LTX Video-0.9.7 13B Distilled and custom LoRA","status":"active","release_date":"2025-05-17","model_type":"video","parameters":13,"page_url":"https://fal.run/fal-ai/ltx-video-13b-distilled","tagline":"Generate videos from prompts using LTX Video-0.9.7 13B Distilled and custom LoRA","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-video/image-to-video","name":"LTX Video (preview)","created_by":"fal","source":"official","description":"Generate videos from images using LTX Video","status":"active","release_date":"2024-11-21","model_type":"video","page_url":"https://fal.run/fal-ai/ltx-video/image-to-video","tagline":"Generate videos from images using LTX Video","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-video-lora/image-to-video","name":"LTX Video-0.9.7 LoRA","created_by":"fal","source":"official","description":"Generate videos from prompts and images using LTX Video-0.9.7 and custom LoRA","status":"active","release_date":"2025-05-15","model_type":"video","page_url":"https://fal.run/fal-ai/ltx-video-lora/image-to-video","tagline":"Generate videos from prompts and images using LTX Video-0.9.7 and custom LoRA","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/ltx-video-lora/multiconditioning","name":"LTX Video-0.9.7 LoRA","created_by":"fal","source":"official","description":"Generate videos from prompts, images, and videos using LTX Video-0.9.7 and custom 
LoRA","status":"active","release_date":"2025-05-15","model_type":"other","page_url":"https://fal.run/fal-ai/ltx-video-lora/multiconditioning","tagline":"Generate videos from prompts, images, and videos using LTX Video-0.9.7 and custom LoRA","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/ltx-video-trainer","name":"LTX Video Trainer","created_by":"fal","source":"official","description":"Train LTX Video 0.9.7 for custom styles and effects.","status":"active","release_date":"2025-05-08","model_type":"other","page_url":"https://fal.run/fal-ai/ltx-video-trainer","tagline":"Train LTX Video 0.9.7 for custom styles and effects.","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/ltx-video-v095/extend","name":"LTX Video-0.9.5","created_by":"fal","source":"official","description":"Generate videos from prompts and videos using LTX Video-0.9.5","status":"active","release_date":"2025-03-05","model_type":"other","page_url":"https://fal.run/fal-ai/ltx-video-v095/extend","tagline":"Generate videos from prompts and videos using LTX Video-0.9.5","last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-video-v095/multiconditioning","name":"LTX Video-0.9.5","created_by":"fal","source":"official","description":"Generate videos from prompts,images, and videos using LTX Video-0.9.5","status":"active","release_date":"2025-03-05","model_type":"other","page_url":"https://fal.run/fal-ai/ltx-video-v095/multiconditioning","tagline":"Generate videos from prompts,images, and videos using LTX Video-0.9.5","capabilities":{"vision":true},"last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-video-v095","name":"LTX Video-0.9.5","created_by":"fal","source":"official","description":"Generate videos from prompts using LTX Video-0.9.5","status":"active","release_date":"2025-03-05","model_type":"video","page_url":"https://fal.run/fal-ai/ltx-video-v095","tagline":"Generate videos from prompts 
using LTX Video-0.9.5","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-video","name":"LTX Video (preview)","created_by":"fal","source":"official","description":"Generate videos from prompts using LTX Video","status":"active","release_date":"2024-10-04","model_type":"video","page_url":"https://fal.run/fal-ai/ltx-video","tagline":"Generate videos from prompts using LTX Video","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx2-v2v-trainer","name":"LTX-2 Video to Video Trainer","created_by":"fal","source":"official","description":"Train LTX-2 for video transformation or video-conditioned generation.","status":"active","release_date":"2026-01-07","model_type":"other","page_url":"https://fal.run/fal-ai/ltx2-v2v-trainer","tagline":"Train LTX-2 for video transformation or video-conditioned generation.","last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx2-video-trainer","name":"LTX-2 Video Trainer","created_by":"fal","source":"official","description":"Train LTX-2 for custom styles and effects.","status":"active","release_date":"2026-01-03","model_type":"other","page_url":"https://fal.run/fal-ai/ltx2-video-trainer","tagline":"Train LTX-2 for custom styles and effects.","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/ltx23-trainer-v2/a2a","name":"LTX 2.3 Trainer (V2) - Audio-to-Audio","created_by":"fal","source":"official","description":"Train a LoRA that transforms one audio clip into another, learning a reference→target mapping from paired audio examples.","status":"active","release_date":"2026-06-17","model_type":"other","page_url":"https://fal.run/fal-ai/ltx23-trainer-v2/a2a","tagline":"Train a LoRA that transforms one audio clip into another, learning a reference→target mapping from paired audio 
examples.","last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx23-trainer-v2/a2v","name":"LTX 2.3 Trainer (V2) - Audio-to-Video","created_by":"fal","source":"official","description":"Train a LoRA that generates video from a start image plus a conditioning audio track, producing motion that matches the sound.","status":"active","release_date":"2026-06-17","model_type":"other","page_url":"https://fal.run/fal-ai/ltx23-trainer-v2/a2v","tagline":"Train a LoRA that generates video from a start image plus a conditioning audio track, producing motion that matches the sound.","capabilities":{"vision":true},"last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx23-trainer-v2/audio-extend-prefix","name":"LTX 2.3 Trainer (V2) - Forward Audio Extension","created_by":"fal","source":"official","description":"Train a LoRA that continues an audio clip forward in time, generating the audio that follows a short clean prefix.","status":"active","release_date":"2026-06-17","model_type":"other","page_url":"https://fal.run/fal-ai/ltx23-trainer-v2/audio-extend-prefix","tagline":"Train a LoRA that continues an audio clip forward in time, generating the audio that follows a short clean prefix.","last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx23-trainer-v2/audio-extend-suffix","name":"LTX 2.3 Trainer (V2) - Backward Audio Extension","created_by":"fal","source":"official","description":"Train a LoRA that generates the lead-in to an audio clip, extending audio backward in time from its ending.","status":"active","release_date":"2026-06-17","model_type":"other","page_url":"https://fal.run/fal-ai/ltx23-trainer-v2/audio-extend-suffix","tagline":"Train a LoRA that generates the lead-in to an audio clip, extending audio backward in time from its ending.","last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx23-trainer-v2/audio-inpaint","name":"LTX 2.3 Trainer (V2) - Audio 
Inpainting","created_by":"fal","source":"official","description":"Train a LoRA that regenerates masked time spans of an audio clip while keeping the rest unchanged.","status":"active","release_date":"2026-06-17","model_type":"other","page_url":"https://fal.run/fal-ai/ltx23-trainer-v2/audio-inpaint","tagline":"Train a LoRA that regenerates masked time spans of an audio clip while keeping the rest unchanged.","last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx23-trainer-v2/av2av-masked","name":"LTX 2.3 Trainer (V2) - Masked Audio+Video Transformation","created_by":"fal","source":"official","description":"Train a LoRA that regenerates a masked video region (guided by kept pixels and a video reference) while jointly generating audio from an audio reference.","status":"active","release_date":"2026-06-17","model_type":"other","page_url":"https://fal.run/fal-ai/ltx23-trainer-v2/av2av-masked","tagline":"Train a LoRA that regenerates a masked video region (guided by kept pixels and a video reference) while jointly generating audio from an audio reference.","last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx23-trainer-v2/av2av","name":"LTX 2.3 Trainer (V2) - Audio+Video Reference Transformation","created_by":"fal","source":"official","description":"Train a LoRA for a joint audio+video transformation, conditioned on a reference clip (its video and audio) to produce a matching target clip.","status":"active","release_date":"2026-06-17","model_type":"other","page_url":"https://fal.run/fal-ai/ltx23-trainer-v2/av2av","tagline":"Train a LoRA for a joint audio+video transformation, conditioned on a reference clip (its video and audio) to produce a matching target clip.","last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx23-trainer-v2/extend-prefix","name":"LTX 2.3 Trainer (V2) - Forward Video Extension","created_by":"fal","source":"official","description":"Train a LoRA that continues a video forward in time — 
supply an opening clip at inference and the model generates what comes next.","status":"active","release_date":"2026-06-17","model_type":"other","page_url":"https://fal.run/fal-ai/ltx23-trainer-v2/extend-prefix","tagline":"Train a LoRA that continues a video forward in time — supply an opening clip at inference and the model generates what comes next.","last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx23-trainer-v2/extend-suffix","name":"LTX 2.3 Trainer (V2) - Backward Video Extension","created_by":"fal","source":"official","description":"Train a LoRA that generates the lead-in to a video, extending a clip backward in time from its ending.","status":"active","release_date":"2026-06-17","model_type":"other","page_url":"https://fal.run/fal-ai/ltx23-trainer-v2/extend-suffix","tagline":"Train a LoRA that generates the lead-in to a video, extending a clip backward in time from its ending.","last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx23-trainer-v2/i2v","name":"LTX 2.3 Trainer (V2) - Image-to-Video","created_by":"fal","source":"official","description":"Fine-tune LTX 2.3 to animate a starting image — supply a still plus a prompt at inference and the model generates a video that begins from that frame.","status":"active","release_date":"2026-06-17","model_type":"other","page_url":"https://fal.run/fal-ai/ltx23-trainer-v2/i2v","tagline":"Fine-tune LTX 2.3 to animate a starting image — supply a still plus a prompt at inference and the model generates a video that begins from that frame.","capabilities":{"vision":true},"last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx23-trainer-v2/ic-lora/a2a","name":"LTX 2.3 Trainer (V2) - Audio-to-Audio IC-LoRA","created_by":"fal","source":"official","description":"Train an IC-LoRA that transforms one audio clip into another, conditioned at inference on a reference audio 
clip.","status":"active","release_date":"2026-06-17","model_type":"other","page_url":"https://fal.run/fal-ai/ltx23-trainer-v2/ic-lora/a2a","tagline":"Train an IC-LoRA that transforms one audio clip into another, conditioned at inference on a reference audio clip.","last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx23-trainer-v2/ic-lora/av2av-masked","name":"LTX 2.3 Trainer (V2) - Masked Audio+Video IC-LoRA","created_by":"fal","source":"official","description":"Train an IC-LoRA that regenerates a masked video region (guided by kept pixels and a video reference) while jointly generating audio from an audio reference.","status":"active","release_date":"2026-06-17","model_type":"other","page_url":"https://fal.run/fal-ai/ltx23-trainer-v2/ic-lora/av2av-masked","tagline":"Train an IC-LoRA that regenerates a masked video region (guided by kept pixels and a video reference) while jointly generating audio from an audio reference.","last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx23-trainer-v2/ic-lora/av2av","name":"LTX 2.3 Trainer (V2) - Audio+Video Reference IC-LoRA","created_by":"fal","source":"official","description":"Train an IC-LoRA for a joint audio+video transformation, conditioned on a reference clip's video and audio to produce a matching target.","status":"active","release_date":"2026-06-17","model_type":"other","page_url":"https://fal.run/fal-ai/ltx23-trainer-v2/ic-lora/av2av","tagline":"Train an IC-LoRA for a joint audio+video transformation, conditioned on a reference clip's video and audio to produce a matching target.","last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx23-trainer-v2/ic-lora/v2v-masked","name":"LTX 2.3 Trainer (V2) - Masked Video-to-Video IC-LoRA","created_by":"fal","source":"official","description":"Train an IC-LoRA that regenerates only the masked region of a video, guided by the kept pixels and a separate reference/control 
video.","status":"active","release_date":"2026-06-17","model_type":"other","page_url":"https://fal.run/fal-ai/ltx23-trainer-v2/ic-lora/v2v-masked","tagline":"Train an IC-LoRA that regenerates only the masked region of a video, guided by the kept pixels and a separate reference/control video.","last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx23-trainer-v2/ic-lora/v2v","name":"LTX 2.3 Trainer (V2) - Video-to-Video IC-LoRA","created_by":"fal","source":"official","description":"Train an IC-LoRA that learns a video-to-video transformation from paired before/after clips, conditioned at inference on a reference (control) video.","status":"active","release_date":"2026-06-17","model_type":"other","page_url":"https://fal.run/fal-ai/ltx23-trainer-v2/ic-lora/v2v","tagline":"Train an IC-LoRA that learns a video-to-video transformation from paired before/after clips, conditioned at inference on a reference (control) video.","last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx23-trainer-v2/inpaint","name":"LTX 2.3 Trainer (V2) - Video Inpainting","created_by":"fal","source":"official","description":"Train a LoRA that regenerates a masked region of a video while keeping the rest unchanged, blending the new content with its surroundings.","status":"active","release_date":"2026-06-17","model_type":"other","page_url":"https://fal.run/fal-ai/ltx23-trainer-v2/inpaint","tagline":"Train a LoRA that regenerates a masked region of a video while keeping the rest unchanged, blending the new content with its surroundings.","last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx23-trainer-v2/interpolate","name":"LTX 2.3 Trainer (V2) - Keyframe Interpolation","created_by":"fal","source":"official","description":"Train a LoRA that generates the video between keyframes — supply first/last (and optional middle) frames at inference and the model fills the in-between 
motion.","status":"active","release_date":"2026-06-17","model_type":"other","page_url":"https://fal.run/fal-ai/ltx23-trainer-v2/interpolate","tagline":"Train a LoRA that generates the video between keyframes — supply first/last (and optional middle) frames at inference and the model fills the in-between motion.","last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx23-trainer-v2/outpaint","name":"LTX 2.3 Trainer (V2) - Spatial Outpainting","created_by":"fal","source":"official","description":"Train a LoRA that expands the video frame outward, keeping an inner rectangle fixed and generating the surrounding region.","status":"active","release_date":"2026-06-17","model_type":"other","page_url":"https://fal.run/fal-ai/ltx23-trainer-v2/outpaint","tagline":"Train a LoRA that expands the video frame outward, keeping an inner rectangle fixed and generating the surrounding region.","last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx23-trainer-v2/t2a","name":"LTX 2.3 Trainer (V2) - Text-to-Audio","created_by":"fal","source":"official","description":"Train a LoRA that generates audio from a text prompt — the audio counterpart of text-to-video — learning a sound or style from your clips.","status":"active","release_date":"2026-06-17","model_type":"other","page_url":"https://fal.run/fal-ai/ltx23-trainer-v2/t2a","tagline":"Train a LoRA that generates audio from a text prompt — the audio counterpart of text-to-video — learning a sound or style from your clips.","last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx23-trainer-v2/t2v","name":"LTX 2.3 Trainer (V2) - Text-to-Video","created_by":"fal","source":"official","description":"Fine-tune LTX 2.3 on your own clips to teach it a new subject, character, object, or visual style, then generate full videos from a text prompt.","status":"active","release_date":"2026-06-17","model_type":"other","page_url":"https://fal.run/fal-ai/ltx23-trainer-v2/t2v","tagline":"Fine-tune 
LTX 2.3 on your own clips to teach it a new subject, character, object, or visual style, then generate full videos from a text prompt.","last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx23-trainer-v2/v2a","name":"LTX 2.3 Trainer (V2) - Video-to-Audio","created_by":"fal","source":"official","description":"Train a LoRA that generates audio (foley / sound design) for a silent video, learning a soundtrack that matches the on-screen action.","status":"active","release_date":"2026-06-17","model_type":"other","page_url":"https://fal.run/fal-ai/ltx23-trainer-v2/v2a","tagline":"Train a LoRA that generates audio (foley / sound design) for a silent video, learning a soundtrack that matches the on-screen action.","last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx23-trainer-v2/v2v-masked","name":"LTX 2.3 Trainer (V2) - Masked Video-to-Video","created_by":"fal","source":"official","description":"Train a LoRA that regenerates only the masked region of a video, guided by both the kept pixels and a separate reference/control video.","status":"active","release_date":"2026-06-17","model_type":"other","page_url":"https://fal.run/fal-ai/ltx23-trainer-v2/v2v-masked","tagline":"Train a LoRA that regenerates only the masked region of a video, guided by both the kept pixels and a separate reference/control video.","last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx23-trainer-v2/v2v","name":"LTX 2.3 Trainer (V2) - Video-to-Video","created_by":"fal","source":"official","description":"Train a LoRA that learns a video-to-video transformation from paired before/after clips, steered at inference by a reference (control) video.","status":"active","release_date":"2026-06-17","model_type":"other","page_url":"https://fal.run/fal-ai/ltx23-trainer-v2/v2v","tagline":"Train a LoRA that learns a video-to-video transformation from paired before/after clips, steered at inference by a reference (control) 
video.","last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx23-v2v-trainer","name":"LTX-2.3 22B Video to Video Trainer","created_by":"fal","source":"official","description":"Train LTX-2.3 22B for video transformation or video-conditioned generation.","status":"active","release_date":"2026-03-17","model_type":"other","page_url":"https://fal.run/fal-ai/ltx23-v2v-trainer","tagline":"Train LTX-2.3 22B for video transformation or video-conditioned generation.","last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx23-video-trainer","name":"LTX-2.3 22B Video Trainer","created_by":"fal","source":"official","description":"Train LTX-2.3 22B for custom styles and effects.","status":"active","release_date":"2026-03-17","model_type":"other","page_url":"https://fal.run/fal-ai/ltx23-video-trainer","tagline":"Train LTX-2.3 22B for custom styles and effects.","last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltxv-13b-098-distilled/extend","name":"LTX-Video 13B 0.9.8 Distilled","created_by":"fal","source":"official","description":"Extend videos using LTX Video-0.9.8 13B Distilled and custom LoRA","status":"active","release_date":"2025-07-23","model_type":"other","parameters":13,"page_url":"https://fal.run/fal-ai/ltxv-13b-098-distilled/extend","tagline":"Extend videos using LTX Video-0.9.8 13B Distilled and custom LoRA","last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltxv-13b-098-distilled/image-to-video","name":"LTX-Video 13B 0.9.8 Distilled","created_by":"fal","source":"official","description":"Generate long videos from prompts and images using LTX Video-0.9.8 13B Distilled and custom LoRA","status":"active","release_date":"2025-07-17","model_type":"video","parameters":13,"page_url":"https://fal.run/fal-ai/ltxv-13b-098-distilled/image-to-video","tagline":"Generate long videos from prompts and images using LTX Video-0.9.8 13B Distilled and custom 
LoRA","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltxv-13b-098-distilled/multiconditioning","name":"LTX-Video 13B 0.9.8 Distilled","created_by":"fal","source":"official","description":"Generate long videos from prompts, images, and videos using LTX Video-0.9.8 13B Distilled and custom LoRA","status":"active","release_date":"2025-07-17","model_type":"other","parameters":13,"page_url":"https://fal.run/fal-ai/ltxv-13b-098-distilled/multiconditioning","tagline":"Generate long videos from prompts, images, and videos using LTX Video-0.9.8 13B Distilled and custom LoRA","capabilities":{"vision":true},"last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltxv-13b-098-distilled","name":"LTX-Video 13B 0.9.8 Distilled","created_by":"fal","source":"official","description":"Generate long videos from prompts using LTX Video-0.9.8 13B Distilled and custom LoRA","status":"active","release_date":"2025-07-17","model_type":"video","parameters":13,"page_url":"https://fal.run/fal-ai/ltxv-13b-098-distilled","tagline":"Generate long videos from prompts using LTX Video-0.9.8 13B Distilled and custom LoRA","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/lucidflux","name":"Lucidflux","created_by":"fal","source":"official","description":"LucidFlux for upscaling images with very high fidelity","status":"active","release_date":"2025-10-03","model_type":"image","page_url":"https://fal.run/fal-ai/lucidflux","tagline":"LucidFlux for upscaling images with very high fidelity","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/luma-dream-machine/ray-2-flash/image-to-video","name":"Luma Ray 2 Flash (Image to 
Video)","created_by":"fal","source":"official","description":"Ray2 Flash is a fast video generative model capable of creating realistic visuals with natural, coherent motion.","status":"active","release_date":"2025-03-17","model_type":"video","page_url":"https://fal.run/fal-ai/luma-dream-machine/ray-2-flash/image-to-video","tagline":"Ray2 Flash is a fast video generative model capable of creating realistic visuals with natural, coherent motion.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/luma-dream-machine/ray-2-flash/modify","name":"Luma Ray 2 Flash Modify","created_by":"fal","source":"official","description":"Ray2 Flash Modify is a video generative model capable of restyling or retexturing the entire shot, from turning live-action into CG or stylized animation, to changing wardrobe, props, or the overall a","status":"active","release_date":"2025-07-17","model_type":"other","page_url":"https://fal.run/fal-ai/luma-dream-machine/ray-2-flash/modify","tagline":"Ray2 Flash Modify is a video generative model capable of restyling or retexturing the entire shot, from turning live-action into CG or stylized animation, to changing wardrobe, props, or the overall a","last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/luma-dream-machine/ray-2-flash/reframe","name":"Luma Ray 2 Flash Reframe","created_by":"fal","source":"official","description":"Adjust and enhance videos with Ray-2 Reframe.","status":"active","release_date":"2025-06-03","model_type":"other","page_url":"https://fal.run/fal-ai/luma-dream-machine/ray-2-flash/reframe","tagline":"Adjust and enhance videos with Ray-2 Reframe.","capabilities":{"tool_call":true},"tools":["function_calling"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/luma-dream-machine/ray-2-flash","name":"Luma Ray 2 
Flash","created_by":"fal","source":"official","description":"Ray2 Flash is a fast video generative model capable of creating realistic visuals with natural, coherent motion.","status":"active","release_date":"2025-03-17","model_type":"video","page_url":"https://fal.run/fal-ai/luma-dream-machine/ray-2-flash","tagline":"Ray2 Flash is a fast video generative model capable of creating realistic visuals with natural, coherent motion.","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/luma-dream-machine/ray-2/image-to-video","name":"Luma Ray 2 (Image to Video)","created_by":"fal","source":"official","description":"Ray2 is a large-scale video generative model capable of creating realistic visuals with natural, coherent motion.","status":"active","release_date":"2025-02-14","model_type":"video","page_url":"https://fal.run/fal-ai/luma-dream-machine/ray-2/image-to-video","tagline":"Ray2 is a large-scale video generative model capable of creating realistic visuals with natural, coherent motion.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/luma-dream-machine/ray-2/modify","name":"Luma Ray 2 Modify","created_by":"fal","source":"official","description":"Ray2 Modify is a video generative model capable of restyling or retexturing the entire shot, from turning live-action into CG or stylized animation, to changing wardrobe, props, or the overall aesthet","status":"active","release_date":"2025-06-28","model_type":"other","page_url":"https://fal.run/fal-ai/luma-dream-machine/ray-2/modify","tagline":"Ray2 Modify is a video generative model capable of restyling or retexturing the entire shot, from turning live-action into CG or stylized animation, to changing wardrobe, props, or the overall 
aesthet","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/luma-dream-machine/ray-2/reframe","name":"Luma Ray 2 Reframe","created_by":"fal","source":"official","description":"Adjust and enhance videos with Ray-2 Reframe.","status":"active","release_date":"2025-06-03","model_type":"other","page_url":"https://fal.run/fal-ai/luma-dream-machine/ray-2/reframe","tagline":"Adjust and enhance videos with Ray-2 Reframe.","capabilities":{"tool_call":true},"tools":["function_calling"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/luma-dream-machine/ray-2","name":"Luma Ray 2","created_by":"fal","source":"official","description":"Ray2 is a large-scale video generative model capable of creating realistic visuals with natural, coherent motion.","status":"active","release_date":"2025-01-27","model_type":"video","page_url":"https://fal.run/fal-ai/luma-dream-machine/ray-2","tagline":"Ray2 is a large-scale video generative model capable of creating realistic visuals with natural, coherent motion.","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/luma-photon/flash/modify","name":"Luma Photon","created_by":"fal","source":"official","description":"Edit images from your prompts using Luma Photon.","status":"active","release_date":"2025-06-08","model_type":"image","page_url":"https://fal.run/fal-ai/luma-photon/flash/modify","tagline":"Edit images from your prompts using Luma Photon.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/luma-photon/flash/reframe","name":"Luma Photon Flash Reframe","created_by":"fal","source":"official","description":"This advanced tool intelligently expands your visuals, seamlessly blending new content to enhance creativity and adaptability, offering unmatched speed and quality for 
creators at a fraction of the co","status":"active","release_date":"2025-06-03","model_type":"image","page_url":"https://fal.run/fal-ai/luma-photon/flash/reframe","tagline":"This advanced tool intelligently expands your visuals, seamlessly blending new content to enhance creativity and adaptability, offering unmatched speed and quality for creators at a fraction of the co","capabilities":{"vision":true,"tool_call":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"tools":["function_calling"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/luma-photon/flash","name":"Luma Photon Flash","created_by":"fal","source":"official","description":"Generate images from your prompts using Luma Photon Flash.","status":"active","release_date":"2024-12-03","model_type":"image","page_url":"https://fal.run/fal-ai/luma-photon/flash","tagline":"Generate images from your prompts using Luma Photon Flash.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/luma-photon/modify","name":"Luma Photon","created_by":"fal","source":"official","description":"Edit images from your prompts using Luma Photon.","status":"active","release_date":"2025-06-08","model_type":"image","page_url":"https://fal.run/fal-ai/luma-photon/modify","tagline":"Edit images from your prompts using Luma Photon.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/luma-photon/reframe","name":"Luma Photon Reframe","created_by":"fal","source":"official","description":"Extend and reframe images with Luma Photon Reframe.","status":"active","release_date":"2025-06-03","model_type":"image","page_url":"https://fal.run/fal-ai/luma-photon/reframe","tagline":"Extend and reframe images with Luma Photon 
Reframe.","capabilities":{"vision":true,"tool_call":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"tools":["function_calling"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/luma-photon","name":"Luma Photon","created_by":"fal","source":"official","description":"Generate images from your prompts using Luma Photon.","status":"active","release_date":"2024-06-03","model_type":"image","page_url":"https://fal.run/fal-ai/luma-photon","tagline":"Generate images from your prompts using Luma Photon.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/lumina-image/v2","name":"Lumina Image 2","created_by":"fal","source":"official","description":"Lumina-Image-2.0 is a 2 billion parameter flow-based diffusion transforer which features improved performance in image quality, typography, complex prompt understanding, and resource-efficiency.","status":"active","release_date":"2025-01-31","model_type":"image","page_url":"https://fal.run/fal-ai/lumina-image/v2","tagline":"Lumina-Image-2.0 is a 2 billion parameter flow-based diffusion transforer which features improved performance in image quality, typography, complex prompt understanding, and resource-efficiency.","capabilities":{"streaming":true,"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/lux-tts","name":"Lux TTS","created_by":"fal","source":"official","description":"High-quality voice cloning TTS model that generates 48kHz speech from text and a reference audio.","status":"active","release_date":"2026-03-12","model_type":"tts","page_url":"https://fal.run/fal-ai/lux-tts","tagline":"High-quality voice cloning TTS model that generates 48kHz speech from text and a reference 
audio.","modalities":{"input":["text"],"output":["audio"]},"endpoints":["audio_speech"],"last_seen_at":"2026-03-12","last_updated":"2026-05-11"},{"id":"fal-ai/lyra-2/zoom","name":"Lyra 2","created_by":"fal","source":"official","description":"Lyra 2.0 is an image-to-video model that turns a single image into an explorable 3D-style video with camera-controlled motion.","status":"active","release_date":"2026-04-21","model_type":"video","page_url":"https://fal.run/fal-ai/lyra-2/zoom","tagline":"Lyra 2.0 is an image-to-video model that turns a single image into an explorable 3D-style video with camera-controlled motion.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-28","last_updated":"2026-05-11"},{"id":"fal-ai/lyria2","name":"Lyria2","created_by":"fal","source":"official","description":"Lyria 2 is Google's latest music generation model, you can generate any type of music with this model.","status":"active","release_date":"2025-05-20","model_type":"other","page_url":"https://fal.run/fal-ai/lyria2","tagline":"Lyria 2 is Google's latest music generation model, you can generate any type of music with this model.","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/lyria3/pro","name":"Lyria 3 Pro","created_by":"fal","source":"official","description":"Lyria 3 Pro is the latest music model from Google","status":"active","release_date":"2026-05-20","model_type":"other","page_url":"https://fal.run/fal-ai/lyria3/pro","tagline":"Lyria 3 Pro is the latest music model from Google","last_seen_at":"2026-05-26","last_updated":"2026-06-03"},{"id":"fal-ai/lyria3","name":"Lyria3","created_by":"fal","source":"official","description":"Lyria 3 is most recent music model from Google","status":"active","release_date":"2026-03-30","model_type":"other","page_url":"https://fal.run/fal-ai/lyria3","tagline":"Lyria 3 is most recent music model from 
Google","last_seen_at":"2026-05-22","last_updated":"2026-06-03"},{"id":"fal-ai/magi-distilled/extend-video","name":"MAGI-1 (Distilled)","created_by":"fal","source":"official","description":"MAGI-1 distilled extends videos faster with an exceptional understanding of physical interactions and prompts","status":"active","release_date":"2025-04-23","model_type":"other","page_url":"https://fal.run/fal-ai/magi-distilled/extend-video","tagline":"MAGI-1 distilled extends videos faster with an exceptional understanding of physical interactions and prompts","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/magi-distilled/image-to-video","name":"MAGI-1 (Distilled)","created_by":"fal","source":"official","description":"MAGI-1 distilled generates videos faster from images with exceptional understanding of physical interactions and prompting","status":"active","release_date":"2025-04-23","model_type":"video","page_url":"https://fal.run/fal-ai/magi-distilled/image-to-video","tagline":"MAGI-1 distilled generates videos faster from images with exceptional understanding of physical interactions and prompting","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/magi-distilled","name":"MAGI-1 (Distilled)","created_by":"fal","source":"official","description":"MAGI-1 distilled is a faster video generation model with exceptional understanding of physical interactions and cinematic prompts","status":"active","release_date":"2025-04-22","model_type":"video","page_url":"https://fal.run/fal-ai/magi-distilled","tagline":"MAGI-1 distilled is a faster video generation model with exceptional understanding of physical interactions and cinematic 
prompts","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/magi/extend-video","name":"MAGI-1","created_by":"fal","source":"official","description":"MAGI-1 extends videos with an exceptional understanding of physical interactions and prompts","status":"active","release_date":"2025-04-23","model_type":"other","page_url":"https://fal.run/fal-ai/magi/extend-video","tagline":"MAGI-1 extends videos with an exceptional understanding of physical interactions and prompts","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/magi/image-to-video","name":"MAGI-1","created_by":"fal","source":"official","description":"MAGI-1 generates videos from images with exceptional understanding of physical interactions and prompting","status":"active","release_date":"2025-04-23","model_type":"video","page_url":"https://fal.run/fal-ai/magi/image-to-video","tagline":"MAGI-1 generates videos from images with exceptional understanding of physical interactions and prompting","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/magi","name":"MAGI-1","created_by":"fal","source":"official","description":"MAGI-1 is a video generation model with exceptional understanding of physical interactions and cinematic prompts","status":"active","release_date":"2025-04-23","model_type":"video","page_url":"https://fal.run/fal-ai/magi","tagline":"MAGI-1 is a video generation model with exceptional understanding of physical interactions and cinematic prompts","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/marlin/find","name":"Marlin Find","created_by":"fal","source":"official","description":"Marlin is a 2B video VLM tuned for the two questions developers actually want to ask of 
their videos: what is happening, and when?","status":"active","release_date":"2026-05-21","model_type":"other","page_url":"https://fal.run/fal-ai/marlin/find","tagline":"Marlin is a 2B video VLM tuned for the two questions developers actually want to ask of their videos: what is happening, and when?","capabilities":{"vision":true},"last_seen_at":"2026-05-21","last_updated":"2026-06-03"},{"id":"fal-ai/marlin","name":"Marlin","created_by":"fal","source":"official","description":"Marlin is a 2B video VLM tuned for the two questions developers actually want to ask of their videos: what is happening, and when?","status":"active","release_date":"2026-05-21","model_type":"other","page_url":"https://fal.run/fal-ai/marlin","tagline":"Marlin is a 2B video VLM tuned for the two questions developers actually want to ask of their videos: what is happening, and when?","capabilities":{"vision":true},"last_seen_at":"2026-05-21","last_updated":"2026-06-03"},{"id":"fal-ai/maya/batch","name":"Maya","created_by":"fal","source":"official","description":"Maya1 is a state-of-the-art speech model by Maya Research for expressive voice generation, built to capture real human emotion and precise voice design.","status":"active","release_date":"2025-12-12","model_type":"tts","page_url":"https://fal.run/fal-ai/maya/batch","tagline":"Maya1 is a state-of-the-art speech model by Maya Research for expressive voice generation, built to capture real human emotion and precise voice design.","modalities":{"input":["text"],"output":["audio"]},"endpoints":["audio_speech"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/maya/stream","name":"Maya","created_by":"fal","source":"official","description":"Maya1 is a state-of-the-art speech model by Maya Research for expressive voice generation, built to capture real human emotion and precise voice design.","status":"active","release_date":"2025-12-12","model_type":"tts","page_url":"https://fal.run/fal-ai/maya/stream","tagline":"Maya1 is 
a state-of-the-art speech model by Maya Research for expressive voice generation, built to capture real human emotion and precise voice design.","modalities":{"input":["text"],"output":["audio"]},"endpoints":["audio_speech"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/maya","name":"Maya1","created_by":"fal","source":"official","description":"Maya1 is a state-of-the-art speech model by Maya Research for expressive voice generation, built to capture real human emotion and precise voice design.","status":"active","release_date":"2025-11-15","model_type":"tts","page_url":"https://fal.run/fal-ai/maya","tagline":"Maya1 is a state-of-the-art speech model by Maya Research for expressive voice generation, built to capture real human emotion and precise voice design.","modalities":{"input":["text"],"output":["audio"]},"endpoints":["audio_speech"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/meshy/rigging/multi-animation","name":"Meshy Rigging Multi Animation","created_by":"fal","source":"official","description":"Meshy auto-rigs a humanoid 3D model fitting a skeleton and binding the mesh, then applies several motion presets from its animation library","status":"active","release_date":"2026-06-12","model_type":"other","page_url":"https://fal.run/fal-ai/meshy/rigging/multi-animation","tagline":"Meshy auto-rigs a humanoid 3D model fitting a skeleton and binding the mesh, then applies several motion presets from its animation library","last_seen_at":"2026-06-17","last_updated":"2026-06-18"},{"id":"fal-ai/meshy/rigging","name":"Meshy Rigging","created_by":"fal","source":"official","description":"Rig humanoid 3D models from GLB URLs with Meshy, returning rigged GLB/FBX files plus basic animations.","status":"active","release_date":"2026-05-19","model_type":"other","page_url":"https://fal.run/fal-ai/meshy/rigging","tagline":"Rig humanoid 3D models from GLB URLs with Meshy, returning rigged GLB/FBX files plus basic 
animations.","last_seen_at":"2026-06-17","last_updated":"2026-06-18"},{"id":"fal-ai/meshy/v5/multi-image-to-3d","name":"Meshy 5 Multi","created_by":"fal","source":"official","description":"Meshy-5 multi image generates realistic and production ready 3D models from multiple images.","status":"active","release_date":"2025-10-06","model_type":"other","page_url":"https://fal.run/fal-ai/meshy/v5/multi-image-to-3d","tagline":"Meshy-5 multi image generates realistic and production ready 3D models from multiple images.","capabilities":{"vision":true},"last_seen_at":"2026-06-17","last_updated":"2026-06-18"},{"id":"fal-ai/meshy/v5/remesh","name":"Meshy 5 Remesh","created_by":"fal","source":"official","description":"Meshy-5 remesh allows you to remesh and export existing 3D models into various formats","status":"active","release_date":"2025-10-18","model_type":"other","page_url":"https://fal.run/fal-ai/meshy/v5/remesh","tagline":"Meshy-5 remesh allows you to remesh and export existing 3D models into various formats","last_seen_at":"2026-06-17","last_updated":"2026-06-18"},{"id":"fal-ai/meshy/v5/retexture","name":"Meshy 5 Retexture","created_by":"fal","source":"official","description":"Meshy-5 retexture applies new, high-quality textures to existing 3D models using either text prompts or reference images.","status":"active","release_date":"2025-10-18","model_type":"other","page_url":"https://fal.run/fal-ai/meshy/v5/retexture","tagline":"Meshy-5 retexture applies new, high-quality textures to existing 3D models using either text prompts or reference images.","capabilities":{"vision":true},"last_seen_at":"2026-06-17","last_updated":"2026-06-18"},{"id":"fal-ai/meshy/v6/image-to-3d","name":"Meshy 6","created_by":"fal","source":"official","description":"Meshy-6 is the latest model from Meshy.","status":"active","release_date":"2026-02-09","model_type":"other","page_url":"https://fal.run/fal-ai/meshy/v6/image-to-3d","tagline":"Meshy-6 is the latest model from 
Meshy.","capabilities":{"vision":true},"last_seen_at":"2026-06-17","last_updated":"2026-06-18"},{"id":"fal-ai/meshy/v6/multi-image-to-3d","name":"Meshy 6 - Multi Image To 3D","created_by":"fal","source":"official","description":"Meshy-6 is the latest model from Meshy.","status":"active","release_date":"2026-04-23","model_type":"other","page_url":"https://fal.run/fal-ai/meshy/v6/multi-image-to-3d","tagline":"Meshy-6 is the latest model from Meshy.","capabilities":{"vision":true},"last_seen_at":"2026-06-17","last_updated":"2026-06-18"},{"id":"fal-ai/meshy/v6-preview/image-to-3d","name":"Meshy 6 Preview","created_by":"fal","source":"official","description":"Meshy-6-Preview is the latest model from Meshy.","status":"active","release_date":"2025-10-06","model_type":"other","page_url":"https://fal.run/fal-ai/meshy/v6-preview/image-to-3d","tagline":"Meshy-6-Preview is the latest model from Meshy.","capabilities":{"vision":true},"last_seen_at":"2026-06-17","last_updated":"2026-06-18"},{"id":"fal-ai/meshy/v6-preview/text-to-3d","name":"Meshy 6 Preview","created_by":"fal","source":"official","description":"Meshy-6-Preview is the latest model from Meshy.","status":"active","release_date":"2025-10-06","model_type":"other","page_url":"https://fal.run/fal-ai/meshy/v6-preview/text-to-3d","tagline":"Meshy-6-Preview is the latest model from Meshy.","last_seen_at":"2026-06-17","last_updated":"2026-06-18"},{"id":"fal-ai/meshy/v6/text-to-3d","name":"Meshy 6","created_by":"fal","source":"official","description":"Meshy-6 is the latest model from Meshy.","status":"active","release_date":"2026-02-09","model_type":"other","page_url":"https://fal.run/fal-ai/meshy/v6/text-to-3d","tagline":"Meshy-6 is the latest model from Meshy.","last_seen_at":"2026-06-17","last_updated":"2026-06-18"},{"id":"fal-ai/minimax/hailuo-02-fast/image-to-video","name":"Minimax","created_by":"fal","source":"official","family":"minimax","description":"Create blazing fast and economical videos with MiniMax Hailuo-02 
Image To Video API at 512p resolution","status":"active","release_date":"2025-08-06","model_type":"video","page_url":"https://fal.run/fal-ai/minimax/hailuo-02-fast/image-to-video","tagline":"Create blazing fast and economical videos with MiniMax Hailuo-02 Image To Video API at 512p resolution","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/minimax/hailuo-02/pro/image-to-video","name":"MiniMax Hailuo 02 [Pro] (Image to Video)","created_by":"fal","source":"official","family":"minimax","description":"MiniMax Hailuo-02 Image To Video API (Pro, 1080p): Advanced image-to-video generation model with 1080p resolution","status":"active","release_date":"2025-06-18","model_type":"video","page_url":"https://fal.run/fal-ai/minimax/hailuo-02/pro/image-to-video","tagline":"MiniMax Hailuo-02 Image To Video API (Pro, 1080p): Advanced image-to-video generation model with 1080p resolution","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/minimax/hailuo-02/pro/text-to-video","name":"MiniMax Hailuo 02 [Pro] (Text to Video)","created_by":"fal","source":"official","family":"minimax","description":"MiniMax Hailuo-02 Text To Video API (Pro, 1080p): Advanced video generation model with 1080p resolution","status":"active","release_date":"2025-06-18","model_type":"video","page_url":"https://fal.run/fal-ai/minimax/hailuo-02/pro/text-to-video","tagline":"MiniMax Hailuo-02 Text To Video API (Pro, 1080p): Advanced video generation model with 1080p resolution","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/minimax/hailuo-02/standard/image-to-video","name":"MiniMax Hailuo 02 [Standard] (Image to 
Video)","created_by":"fal","source":"official","family":"minimax","description":"MiniMax Hailuo-02 Image To Video API (Standard, 768p, 512p): Advanced image-to-video generation model with 768p and 512p resolutions","status":"active","release_date":"2025-06-18","model_type":"video","page_url":"https://fal.run/fal-ai/minimax/hailuo-02/standard/image-to-video","tagline":"MiniMax Hailuo-02 Image To Video API (Standard, 768p, 512p): Advanced image-to-video generation model with 768p and 512p resolutions","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/minimax/hailuo-02/standard/text-to-video","name":"MiniMax Hailuo 02 [Standard] (Text to Video)","created_by":"fal","source":"official","family":"minimax","description":"MiniMax Hailuo-02 Text To Video API (Standard, 768p): Advanced video generation model with 768p resolution","status":"active","release_date":"2025-06-18","model_type":"video","page_url":"https://fal.run/fal-ai/minimax/hailuo-02/standard/text-to-video","tagline":"MiniMax Hailuo-02 Text To Video API (Standard, 768p): Advanced video generation model with 768p resolution","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/minimax/hailuo-2.3-fast/pro/image-to-video","name":"MiniMax Hailuo 2.3 Fast [Pro] (Image to Video)","created_by":"fal","source":"official","family":"minimax","description":"MiniMax Hailuo-2.3-Fast Image To Video API (Pro, 1080p): Advanced fast image-to-video generation model with 1080p resolution","status":"active","release_date":"2025-10-27","model_type":"video","page_url":"https://fal.run/fal-ai/minimax/hailuo-2.3-fast/pro/image-to-video","tagline":"MiniMax Hailuo-2.3-Fast Image To Video API (Pro, 1080p): Advanced fast image-to-video generation model with 1080p 
resolution","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/minimax/hailuo-2.3-fast/standard/image-to-video","name":"MiniMax Hailuo 2.3 Fast [Standard] (Image to Video)","created_by":"fal","source":"official","family":"minimax","description":"MiniMax Hailuo-2.3-Fast Image To Video API (Standard, 768p): Advanced fast image-to-video generation model with 768p resolution","status":"active","release_date":"2025-10-27","model_type":"video","page_url":"https://fal.run/fal-ai/minimax/hailuo-2.3-fast/standard/image-to-video","tagline":"MiniMax Hailuo-2.3-Fast Image To Video API (Standard, 768p): Advanced fast image-to-video generation model with 768p resolution","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/minimax/hailuo-2.3/pro/image-to-video","name":"MiniMax Hailuo 2.3 [Pro] (Image to Video)","created_by":"fal","source":"official","family":"minimax","description":"MiniMax Hailuo-2.3 Image To Video API (Pro, 1080p): Advanced image-to-video generation model with 1080p resolution","status":"active","release_date":"2025-10-27","model_type":"video","page_url":"https://fal.run/fal-ai/minimax/hailuo-2.3/pro/image-to-video","tagline":"MiniMax Hailuo-2.3 Image To Video API (Pro, 1080p): Advanced image-to-video generation model with 1080p resolution","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/minimax/hailuo-2.3/pro/text-to-video","name":"MiniMax Hailuo 2.3 [Pro] (Text to Video)","created_by":"fal","source":"official","family":"minimax","description":"MiniMax Hailuo-2.3 Text To Video API (Pro, 1080p): Advanced text-to-video generation model with 1080p 
resolution","status":"active","release_date":"2025-10-27","model_type":"video","page_url":"https://fal.run/fal-ai/minimax/hailuo-2.3/pro/text-to-video","tagline":"MiniMax Hailuo-2.3 Text To Video API (Pro, 1080p): Advanced text-to-video generation model with 1080p resolution","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/minimax/hailuo-2.3/standard/image-to-video","name":"MiniMax Hailuo 2.3 [Standard] (Image to Video)","created_by":"fal","source":"official","family":"minimax","description":"MiniMax Hailuo-2.3 Image To Video API (Standard, 768p): Advanced image-to-video generation model with 768p resolution","status":"active","release_date":"2025-10-27","model_type":"video","page_url":"https://fal.run/fal-ai/minimax/hailuo-2.3/standard/image-to-video","tagline":"MiniMax Hailuo-2.3 Image To Video API (Standard, 768p): Advanced image-to-video generation model with 768p resolution","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/minimax/hailuo-2.3/standard/text-to-video","name":"MiniMax Hailuo 2.3 [Standard] (Text to Video)","created_by":"fal","source":"official","family":"minimax","description":"MiniMax Hailuo-2.3 Text To Video API (Standard, 768p): Advanced text-to-video generation model with 768p resolution","status":"active","release_date":"2025-10-27","model_type":"video","page_url":"https://fal.run/fal-ai/minimax/hailuo-2.3/standard/text-to-video","tagline":"MiniMax Hailuo-2.3 Text To Video API (Standard, 768p): Advanced text-to-video generation model with 768p resolution","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/minimax/image-01/subject-reference","name":"Minimax Image Subject 
Reference","created_by":"fal","source":"official","family":"minimax","description":"Generate images from text and a reference image using MiniMax Image-01 for consistent character appearance.","status":"active","release_date":"2025-05-06","model_type":"image","page_url":"https://fal.run/fal-ai/minimax/image-01/subject-reference","tagline":"Generate images from text and a reference image using MiniMax Image-01 for consistent character appearance.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/minimax/image-01","name":"MiniMax (Hailuo AI) Text to Image","created_by":"fal","source":"official","family":"minimax","description":"Generate high quality images from text prompts using MiniMax Image-01.","status":"active","release_date":"2025-05-06","model_type":"image","page_url":"https://fal.run/fal-ai/minimax/image-01","tagline":"Generate high quality images from text prompts using MiniMax Image-01.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/minimax-music/v1.5","name":"MiniMax (Hailuo AI) Music v1.5","created_by":"fal","source":"official","family":"minimax","description":"Generate music from text prompts using the MiniMax model, which leverages advanced AI techniques to create high-quality, diverse musical compositions.","status":"active","release_date":"2025-09-11","model_type":"other","page_url":"https://fal.run/fal-ai/minimax-music/v1.5","tagline":"Generate music from text prompts using the MiniMax model, which leverages advanced AI techniques to create high-quality, diverse musical compositions.","last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/minimax-music/v2.5","name":"Minimax Music 2.5","created_by":"fal","source":"official","family":"minimax","description":"MiniMax Music 2.5 
creates complete tracks with singing, backing music, and detailed arrangements from lyrics and a style description.","status":"active","release_date":"2026-04-11","model_type":"other","page_url":"https://fal.run/fal-ai/minimax-music/v2.5","tagline":"MiniMax Music 2.5 creates complete tracks with singing, backing music, and detailed arrangements from lyrics and a style description.","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/minimax-music/v2.6","name":"Minimax Music 2.6","created_by":"fal","source":"official","family":"minimax","description":"MiniMax Music 2.6 creates complete tracks with singing, backing music, and detailed arrangements from lyrics and a style description.","status":"active","release_date":"2026-04-11","model_type":"other","page_url":"https://fal.run/fal-ai/minimax-music/v2.6","tagline":"MiniMax Music 2.6 creates complete tracks with singing, backing music, and detailed arrangements from lyrics and a style description.","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/minimax-music/v2","name":"Minimax Music","created_by":"fal","source":"official","family":"minimax","description":"Generate music from text prompts using the MiniMax Music 2.0 model, which leverages advanced AI techniques to create high-quality, diverse musical compositions.","status":"active","release_date":"2025-10-30","model_type":"other","page_url":"https://fal.run/fal-ai/minimax-music/v2","tagline":"Generate music from text prompts using the MiniMax Music 2.0 model, which leverages advanced AI techniques to create high-quality, diverse musical compositions.","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/minimax-music","name":"MiniMax (Hailuo AI) Music","created_by":"fal","source":"official","family":"minimax","description":"Generate music from text prompts using the MiniMax model, which leverages advanced AI techniques to create high-quality, diverse musical 
compositions.","status":"active","release_date":"2024-12-17","model_type":"other","page_url":"https://fal.run/fal-ai/minimax-music","tagline":"Generate music from text prompts using the MiniMax model, which leverages advanced AI techniques to create high-quality, diverse musical compositions.","last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/minimax/preview/speech-2.5-hd","name":"Minimax","created_by":"fal","source":"official","family":"minimax","description":"Generate speech from text prompts and different voices using the MiniMax Speech-02 HD model, which leverages advanced AI techniques to create high-quality text-to-speech.","status":"active","release_date":"2025-08-11","model_type":"tts","page_url":"https://fal.run/fal-ai/minimax/preview/speech-2.5-hd","tagline":"Generate speech from text prompts and different voices using the MiniMax Speech-02 HD model, which leverages advanced AI techniques to create high-quality text-to-speech.","modalities":{"input":["text"],"output":["audio"]},"endpoints":["audio_speech"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/minimax/preview/speech-2.5-turbo","name":"Minimax","created_by":"fal","source":"official","family":"minimax","description":"Generate fast speech from text prompts and different voices using the MiniMax Speech-02 Turbo model, which leverages advanced AI techniques to create high-quality text-to-speech.","status":"active","release_date":"2025-08-11","model_type":"tts","page_url":"https://fal.run/fal-ai/minimax/preview/speech-2.5-turbo","tagline":"Generate fast speech from text prompts and different voices using the MiniMax Speech-02 Turbo model, which leverages advanced AI techniques to create high-quality text-to-speech.","modalities":{"input":["text"],"output":["audio"]},"endpoints":["audio_speech"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/minimax/speech-02-hd","name":"MiniMax Speech-02 
HD","created_by":"fal","source":"official","family":"minimax","description":"Generate speech from text prompts and different voices using the MiniMax Speech-02 HD model, which leverages advanced AI techniques to create high-quality text-to-speech.","status":"active","release_date":"2025-05-06","model_type":"tts","page_url":"https://fal.run/fal-ai/minimax/speech-02-hd","tagline":"Generate speech from text prompts and different voices using the MiniMax Speech-02 HD model, which leverages advanced AI techniques to create high-quality text-to-speech.","modalities":{"input":["text"],"output":["audio"]},"endpoints":["audio_speech"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/minimax/speech-02-turbo","name":"MiniMax Speech-02 Turbo","created_by":"fal","source":"official","family":"minimax","description":"Generate fast speech from text prompts and different voices using the MiniMax Speech-02 Turbo model, which leverages advanced AI techniques to create high-quality text-to-speech.","status":"active","release_date":"2025-05-06","model_type":"tts","page_url":"https://fal.run/fal-ai/minimax/speech-02-turbo","tagline":"Generate fast speech from text prompts and different voices using the MiniMax Speech-02 Turbo model, which leverages advanced AI techniques to create high-quality text-to-speech.","modalities":{"input":["text"],"output":["audio"]},"endpoints":["audio_speech"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/minimax/speech-2.6-hd","name":"MiniMax Speech 2.6 [HD]","created_by":"fal","source":"official","family":"minimax","description":"Generate speech from text prompts and different voices using the MiniMax Speech-2.6 HD model, which leverages advanced AI techniques to create high-quality text-to-speech.","status":"active","release_date":"2025-10-29","model_type":"tts","page_url":"https://fal.run/fal-ai/minimax/speech-2.6-hd","tagline":"Generate speech from text prompts and different voices using the MiniMax 
Speech-2.6 HD model, which leverages advanced AI techniques to create high-quality text-to-speech.","capabilities":{"streaming":true},"modalities":{"input":["text"],"output":["audio"]},"endpoints":["audio_speech"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/minimax/speech-2.6-turbo","name":"MiniMax Speech 2.6 [Turbo]","created_by":"fal","source":"official","family":"minimax","description":"Generate speech from text prompts and different voices using the MiniMax Speech-2.6 HD model, which leverages advanced AI techniques to create high-quality text-to-speech.","status":"active","release_date":"2025-10-29","model_type":"tts","page_url":"https://fal.run/fal-ai/minimax/speech-2.6-turbo","tagline":"Generate speech from text prompts and different voices using the MiniMax Speech-2.6 HD model, which leverages advanced AI techniques to create high-quality text-to-speech.","capabilities":{"streaming":true},"modalities":{"input":["text"],"output":["audio"]},"endpoints":["audio_speech"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/minimax/speech-2.8-hd","name":"MiniMax Speech 2.8 [HD]","created_by":"fal","source":"official","family":"minimax","description":"Generate speech from text prompts and different voices using the MiniMax Speech-2.8 HD model, which leverages advanced AI techniques to create high-quality text-to-speech.","status":"active","release_date":"2026-02-04","model_type":"tts","page_url":"https://fal.run/fal-ai/minimax/speech-2.8-hd","tagline":"Generate speech from text prompts and different voices using the MiniMax Speech-2.8 HD model, which leverages advanced AI techniques to create high-quality text-to-speech.","capabilities":{"streaming":true},"modalities":{"input":["text"],"output":["audio"]},"endpoints":["audio_speech"],"last_seen_at":"2026-05-07","last_updated":"2026-05-11"},{"id":"fal-ai/minimax/speech-2.8-turbo","name":"MiniMax Speech 2.8 
[Turbo]","created_by":"fal","source":"official","family":"minimax","description":"Generate speech from text prompts and different voices using the MiniMax Speech-2.8 Turbo model, which leverages advanced AI techniques to create high-quality text-to-speech.","status":"active","release_date":"2026-02-04","model_type":"tts","page_url":"https://fal.run/fal-ai/minimax/speech-2.8-turbo","tagline":"Generate speech from text prompts and different voices using the MiniMax Speech-2.8 Turbo model, which leverages advanced AI techniques to create high-quality text-to-speech.","capabilities":{"streaming":true},"modalities":{"input":["text"],"output":["audio"]},"endpoints":["audio_speech"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/minimax/video-01-director/image-to-video","name":"MiniMax (Hailuo AI) Video 01 Director - Image to Video","created_by":"fal","source":"official","family":"minimax","description":"Generate video clips more accurately with respect to initial image, natural language descriptions, and using camera movement instructions for shot control.","status":"active","release_date":"2025-02-24","model_type":"video","page_url":"https://fal.run/fal-ai/minimax/video-01-director/image-to-video","tagline":"Generate video clips more accurately with respect to initial image, natural language descriptions, and using camera movement instructions for shot control.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/minimax/video-01-director","name":"MiniMax (Hailuo AI) Video 01 Director","created_by":"fal","source":"official","family":"minimax","description":"Generate video clips more accurately with respect to natural language descriptions and using camera movement instructions for shot 
control.","status":"active","release_date":"2025-02-11","model_type":"video","page_url":"https://fal.run/fal-ai/minimax/video-01-director","tagline":"Generate video clips more accurately with respect to natural language descriptions and using camera movement instructions for shot control.","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/minimax/video-01/image-to-video","name":"MiniMax (Hailuo AI) Video 01","created_by":"fal","source":"official","family":"minimax","description":"Generate video clips from your images using MiniMax Video model","status":"active","release_date":"2024-10-30","model_type":"video","page_url":"https://fal.run/fal-ai/minimax/video-01/image-to-video","tagline":"Generate video clips from your images using MiniMax Video model","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/minimax/video-01-live/image-to-video","name":"MiniMax (Hailuo AI) Video 01","created_by":"fal","source":"official","family":"minimax","description":"Generate video clips from your images using MiniMax Video model","status":"active","release_date":"2024-12-16","model_type":"video","page_url":"https://fal.run/fal-ai/minimax/video-01-live/image-to-video","tagline":"Generate video clips from your images using MiniMax Video model","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/minimax/video-01-live","name":"MiniMax (Hailuo AI) Video 01 Live","created_by":"fal","source":"official","family":"minimax","description":"Generate video clips from your prompts using MiniMax model","status":"active","release_date":"2024-12-16","model_type":"video","page_url":"https://fal.run/fal-ai/minimax/video-01-live","tagline":"Generate 
video clips from your prompts using MiniMax model","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/minimax/video-01-subject-reference","name":"MiniMax (Hailuo AI) Video 01 Subject Reference","created_by":"fal","source":"official","family":"minimax","description":"Generate video clips maintaining consistent, realistic facial features and identity across dynamic video content","status":"active","release_date":"2025-01-20","model_type":"video","page_url":"https://fal.run/fal-ai/minimax/video-01-subject-reference","tagline":"Generate video clips maintaining consistent, realistic facial features and identity across dynamic video content","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/minimax/video-01","name":"MiniMax (Hailuo AI) Video 01","created_by":"fal","source":"official","family":"minimax","description":"Generate video clips from your prompts using MiniMax model","status":"active","release_date":"2024-02-13","model_type":"video","page_url":"https://fal.run/fal-ai/minimax/video-01","tagline":"Generate video clips from your prompts using MiniMax model","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/minimax/voice-clone","name":"MiniMax Voice Cloning","created_by":"fal","source":"official","family":"minimax","description":"Clone a voice from a sample audio and generate speech from text prompts using the MiniMax model, which leverages advanced AI techniques to create high-quality text-to-speech.","status":"active","release_date":"2025-05-06","model_type":"tts","page_url":"https://fal.run/fal-ai/minimax/voice-clone","tagline":"Clone a voice from a sample audio and generate speech from text prompts using the MiniMax model, which leverages advanced 
AI techniques to create high-quality text-to-speech.","modalities":{"input":["text"],"output":["audio"]},"endpoints":["audio_speech"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/minimax/voice-design","name":"MiniMax Voice Design","created_by":"fal","source":"official","family":"minimax","description":"Design a personalized voice from a text description, and generate speech from text prompts using the MiniMax model, which leverages advanced AI techniques to create high-quality text-to-speech.","status":"active","release_date":"2025-07-18","model_type":"tts","page_url":"https://fal.run/fal-ai/minimax/voice-design","tagline":"Design a personalized voice from a text description, and generate speech from text prompts using the MiniMax model, which leverages advanced AI techniques to create high-quality text-to-speech.","modalities":{"input":["text"],"output":["audio"]},"endpoints":["audio_speech"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/mix-dehaze-net","name":"MixDehazer","created_by":"fal","source":"official","description":"An advanced dehaze model to remove atmospheric haze, restoring clarity and detail in images through intelligent neural network processing.","status":"active","release_date":"2025-03-24","model_type":"image","page_url":"https://fal.run/fal-ai/mix-dehaze-net","tagline":"An advanced dehaze model to remove atmospheric haze, restoring clarity and detail in images through intelligent neural network processing.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/mmaudio-v2/text-to-audio","name":"MMAudio V2 Text to Audio","created_by":"fal","source":"official","description":"MMAudio generates synchronized audio given text 
inputs.","status":"active","release_date":"2024-12-20","model_type":"other","page_url":"https://fal.run/fal-ai/mmaudio-v2/text-to-audio","tagline":"MMAudio generates synchronized audio given text inputs.","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/mmaudio-v2","name":"MMAudio V2","created_by":"fal","source":"official","description":"MMAudio generates synchronized audio given video and/or text inputs.","status":"active","release_date":"2024-12-12","model_type":"other","page_url":"https://fal.run/fal-ai/mmaudio-v2","tagline":"MMAudio generates synchronized audio given video and/or text inputs.","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/mochi-v1","name":"Mochi 1","created_by":"fal","source":"official","description":"Mochi 1 preview is an open state-of-the-art video generation model with high-fidelity motion and strong prompt adherence in preliminary evaluation.","status":"active","release_date":"2024-11-07","model_type":"video","page_url":"https://fal.run/fal-ai/mochi-v1","tagline":"Mochi 1 preview is an open state-of-the-art video generation model with high-fidelity motion and strong prompt adherence in preliminary evaluation.","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/moondream/batched","name":"Moondream","created_by":"fal","source":"official","description":"Answer questions from the images.","status":"active","release_date":"2024-03-20","model_type":"other","page_url":"https://fal.run/fal-ai/moondream/batched","tagline":"Answer questions from the images.","capabilities":{"vision":true},"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/moondream-next/batch","name":"MoonDreamNext Batch","created_by":"fal","source":"official","description":"MoonDreamNext Batch is a multimodal vision-language model for batch 
captioning.","status":"active","release_date":"2025-01-17","model_type":"other","page_url":"https://fal.run/fal-ai/moondream-next/batch","tagline":"MoonDreamNext Batch is a multimodal vision-language model for batch captioning.","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/moondream-next/detection","name":"MoonDreamNext Detection","created_by":"fal","source":"official","description":"MoonDreamNext Detection is a multimodal vision-language model for gaze detection, bbox detection, point detection, and more.","status":"active","release_date":"2025-01-09","model_type":"image","page_url":"https://fal.run/fal-ai/moondream-next/detection","tagline":"MoonDreamNext Detection is a multimodal vision-language model for gaze detection, bbox detection, point detection, and more.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/moondream-next","name":"MoonDreamNext","created_by":"fal","source":"official","description":"MoonDreamNext is a multimodal vision-language model for captioning, gaze detection, bbox detection, point detection, and more.","status":"active","release_date":"2025-01-09","model_type":"other","page_url":"https://fal.run/fal-ai/moondream-next","tagline":"MoonDreamNext is a multimodal vision-language model for captioning, gaze detection, bbox detection, point detection, and more.","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/moondream2/object-detection","name":"Moondream2","created_by":"fal","source":"official","description":"Moondream2 is a highly efficient open-source vision language model that combines powerful image understanding capabilities with a remarkably small 
footprint.","status":"active","release_date":"2025-04-26","model_type":"other","page_url":"https://fal.run/fal-ai/moondream2/object-detection","tagline":"Moondream2 is a highly efficient open-source vision language model that combines powerful image understanding capabilities with a remarkably small footprint.","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/moondream2/point-object-detection","name":"Moondream2","created_by":"fal","source":"official","description":"Moondream2 is a highly efficient open-source vision language model that combines powerful image understanding capabilities with a remarkably small footprint.","status":"active","release_date":"2025-04-26","model_type":"other","page_url":"https://fal.run/fal-ai/moondream2/point-object-detection","tagline":"Moondream2 is a highly efficient open-source vision language model that combines powerful image understanding capabilities with a remarkably small footprint.","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/moondream2/visual-query","name":"Moondream2","created_by":"fal","source":"official","description":"Moondream2 is a highly efficient open-source vision language model that combines powerful image understanding capabilities with a remarkably small footprint.","status":"active","release_date":"2025-04-26","model_type":"other","page_url":"https://fal.run/fal-ai/moondream2/visual-query","tagline":"Moondream2 is a highly efficient open-source vision language model that combines powerful image understanding capabilities with a remarkably small footprint.","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/moondream2","name":"Moondream2","created_by":"fal","source":"official","description":"Moondream2 is a highly efficient open-source vision language model that combines powerful image understanding capabilities with a remarkably small 
footprint.","status":"active","release_date":"2025-04-26","model_type":"other","page_url":"https://fal.run/fal-ai/moondream2","tagline":"Moondream2 is a highly efficient open-source vision language model that combines powerful image understanding capabilities with a remarkably small footprint.","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/moondream3-preview/caption","name":"Moondream3 Preview [Caption]","created_by":"fal","source":"official","description":"Moondream 3 is a vision language model that brings frontier-level visual reasoning with native object detection, pointing, and OCR capabilities to real-world applications requiring fast, inexpensive i","status":"active","release_date":"2025-10-09","model_type":"other","page_url":"https://fal.run/fal-ai/moondream3-preview/caption","tagline":"Moondream 3 is a vision language model that brings frontier-level visual reasoning with native object detection, pointing, and OCR capabilities to real-world applications requiring fast, inexpensive i","capabilities":{"vision":true,"reasoning":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/moondream3-preview/detect","name":"Moondream3 Preview [Detect]","created_by":"fal","source":"official","description":"Moondream 3 is a vision language model that brings frontier-level visual reasoning with native object detection, pointing, and OCR capabilities to real-world applications requiring fast, inexpensive i","status":"active","release_date":"2025-10-09","model_type":"other","page_url":"https://fal.run/fal-ai/moondream3-preview/detect","tagline":"Moondream 3 is a vision language model that brings frontier-level visual reasoning with native object detection, pointing, and OCR capabilities to real-world applications requiring fast, inexpensive 
i","capabilities":{"vision":true,"reasoning":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/moondream3-preview/point","name":"Moondream3 Preview [Point]","created_by":"fal","source":"official","description":"Moondream 3 is a vision language model that brings frontier-level visual reasoning with native object detection, pointing, and OCR capabilities to real-world applications requiring fast, inexpensive i","status":"active","release_date":"2025-10-09","model_type":"other","page_url":"https://fal.run/fal-ai/moondream3-preview/point","tagline":"Moondream 3 is a vision language model that brings frontier-level visual reasoning with native object detection, pointing, and OCR capabilities to real-world applications requiring fast, inexpensive i","capabilities":{"vision":true,"reasoning":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/moondream3-preview/query","name":"Moondream 3 Preview [Query]","created_by":"fal","source":"official","description":"Moondream 3 is a vision language model that brings frontier-level visual reasoning with native object detection, pointing, and OCR capabilities to real-world applications requiring fast, inexpensive i","status":"active","release_date":"2025-10-09","model_type":"other","page_url":"https://fal.run/fal-ai/moondream3-preview/query","tagline":"Moondream 3 is a vision language model that brings frontier-level visual reasoning with native object detection, pointing, and OCR capabilities to real-world applications requiring fast, inexpensive i","capabilities":{"vision":true,"reasoning":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/moondream3-preview/segment","name":"Moondream3 Preview [Segment]","created_by":"fal","source":"official","description":"Moondream 3 is a vision language model that brings frontier-level visual reasoning with native object detection, pointing, and OCR capabilities to real-world applications requiring fast, inexpensive 
inference at scale.","status":"active","release_date":"2025-12-12","model_type":"image","page_url":"https://fal.run/fal-ai/moondream3-preview/segment","tagline":"Moondream 3 is a vision language model that brings frontier-level visual reasoning with native object detection, pointing, and OCR capabilities to real-world applications requiring fast, inexpensive i","capabilities":{"vision":true,"reasoning":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/multishot-master","name":"Multishot Master","created_by":"fal","source":"official","description":"MultiShotMaster is a controllable multi-shot narrative video generation framework that supports text-driven inter-shot consistency, variable shot counts and shot durations, customized subject with mot","status":"active","release_date":"2026-02-24","model_type":"video","page_url":"https://fal.run/fal-ai/multishot-master","tagline":"MultiShotMaster is a controllable multi-shot narrative video generation framework that supports text-driven inter-shot consistency, variable shot counts and shot durations, customized subject with mot","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/musetalk","name":"MuseTalk","created_by":"fal","source":"official","description":"MuseTalk is a real-time high quality audio-driven lip-syncing model.","status":"active","release_date":"2024-04-11","model_type":"video","page_url":"https://fal.run/fal-ai/musetalk","tagline":"MuseTalk is a real-time high quality audio-driven lip-syncing model.","capabilities":{"vision":true},"modalities":{"input":["text","image","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/nafnet/deblur","name":"NAFNet-deblur","created_by":"fal","source":"official","description":"Use NAFNet to fix issues like 
blurriness and noise in your images.","status":"active","release_date":"2025-02-21","model_type":"image","page_url":"https://fal.run/fal-ai/nafnet/deblur","tagline":"Use NAFNet to fix issues like blurriness and noise in your images.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/nafnet/denoise","name":"NAFNet-denoise","created_by":"fal","source":"official","description":"Use NAFNet to fix issues like blurriness and noise in your images.","status":"active","release_date":"2025-02-21","model_type":"image","page_url":"https://fal.run/fal-ai/nafnet/denoise","tagline":"Use NAFNet to fix issues like blurriness and noise in your images.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/nano-banana-2/edit","name":"Nano Banana 2","created_by":"fal","source":"official","description":"Nano Banana 2 is Google's new state-of-the-art image generation and editing model\n","status":"active","release_date":"2026-02-26","model_type":"image","page_url":"https://fal.run/fal-ai/nano-banana-2/edit","tagline":"Nano Banana 2 is Google's new state-of-the-art image generation and editing model\n","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-28","last_updated":"2026-05-11"},{"id":"fal-ai/nano-banana-2","name":"Nano Banana 2","created_by":"fal","source":"official","description":"Nano Banana 2 is Google's new state-of-the-art fast image generation and editing model","status":"active","release_date":"2026-02-26","model_type":"image","page_url":"https://fal.run/fal-ai/nano-banana-2","tagline":"Nano Banana 2 is Google's new state-of-the-art fast image generation and editing 
model","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-11","last_updated":"2026-06-18"},{"id":"fal-ai/nano-banana/edit","name":"Nano Banana","created_by":"fal","source":"official","description":"Google's famous original image generation and editing model","status":"active","release_date":"2025-08-19","model_type":"image","page_url":"https://fal.run/fal-ai/nano-banana/edit","tagline":"Google's famous original image generation and editing model","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-26","last_updated":"2026-06-29"},{"id":"fal-ai/nano-banana-pro/edit","name":"Nano Banana Pro","created_by":"fal","source":"official","description":"Nano Banana Pro is Google's new state-of-the-art image generation and editing model","status":"active","release_date":"2025-11-20","model_type":"image","page_url":"https://fal.run/fal-ai/nano-banana-pro/edit","tagline":"Nano Banana Pro is Google's new state-of-the-art image generation and editing model","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-18","last_updated":"2026-06-20"},{"id":"fal-ai/nano-banana-pro","name":"Nano Banana Pro","created_by":"fal","source":"official","description":"Nano Banana Pro is Google's new state-of-the-art image generation and editing model","status":"active","release_date":"2025-11-20","model_type":"image","page_url":"https://fal.run/fal-ai/nano-banana-pro","tagline":"Nano Banana Pro is Google's new state-of-the-art image generation and editing model","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-28","last_updated":"2026-05-11"},{"id":"fal-ai/nano-banana","name":"Nano Banana","created_by":"fal","source":"official","description":"Google's famous original image 
generation and editing model","status":"active","release_date":"2025-08-19","model_type":"image","page_url":"https://fal.run/fal-ai/nano-banana","tagline":"Google's famous original image generation and editing model","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/nemotron-diffusion-vlm","name":"Nemotron Diffusion Vlm","created_by":"fal","source":"official","description":"Nemotron-Labs-Diffusion-VLM-8B is the vision-language extension of the Nemotron-Labs-Diffusion family.","status":"active","release_date":"2026-05-21","model_type":"other","page_url":"https://fal.run/fal-ai/nemotron-diffusion-vlm","tagline":"Nemotron-Labs-Diffusion-VLM-8B is the vision-language extension of the Nemotron-Labs-Diffusion family.","capabilities":{"vision":true},"last_seen_at":"2026-05-21","last_updated":"2026-06-03"},{"id":"fal-ai/nextstep-1","name":"Nextstep 1","created_by":"fal","source":"official","description":"Endpoint for NextStep-1 Autoregressive Image Editing model.","status":"active","release_date":"2025-08-19","model_type":"image","page_url":"https://fal.run/fal-ai/nextstep-1","tagline":"Endpoint for NextStep-1 Autoregressive Image Editing model.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/nova-sr","name":"Nova SR","created_by":"fal","source":"official","description":"Enhance muffled 16 kHz speech audio into crystal-clear 48 kHz","status":"active","release_date":"2026-01-13","model_type":"other","page_url":"https://fal.run/fal-ai/nova-sr","tagline":"Enhance muffled 16 kHz speech audio into crystal-clear 48 kHz","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/nucleus-image","name":"Nucleus Image","created_by":"fal","source":"official","description":"Nucleus-Image is a text-to-image 
generation model built on a sparse mixture-of-experts (MoE) diffusion transformer architecture.","status":"active","release_date":"2026-04-16","model_type":"image","page_url":"https://fal.run/fal-ai/nucleus-image","tagline":"Nucleus-Image is a text-to-image generation model built on a sparse mixture-of-experts (MoE) diffusion transformer architecture.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-28","last_updated":"2026-05-11"},{"id":"fal-ai/object-removal/bbox","name":"Object Removal","created_by":"fal","source":"official","description":"Removes box-selected objects and their visual effects, seamlessly reconstructing the scene with contextually appropriate content.","status":"active","release_date":"2025-06-16","model_type":"image","page_url":"https://fal.run/fal-ai/object-removal/bbox","tagline":"Removes box-selected objects and their visual effects, seamlessly reconstructing the scene with contextually appropriate content.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/object-removal/mask","name":"Object Removal","created_by":"fal","source":"official","description":"Removes mask-selected objects and their visual effects, seamlessly reconstructing the scene with contextually appropriate content.","status":"active","release_date":"2025-06-16","model_type":"image","page_url":"https://fal.run/fal-ai/object-removal/mask","tagline":"Removes mask-selected objects and their visual effects, seamlessly reconstructing the scene with contextually appropriate content.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/object-removal","name":"Object Removal","created_by":"fal","source":"official","description":"Removes 
objects and their visual effects using natural language, replacing them with contextually appropriate content","status":"active","release_date":"2025-06-16","model_type":"image","page_url":"https://fal.run/fal-ai/object-removal","tagline":"Removes objects and their visual effects using natural language, replacing them with contextually appropriate content","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/omni-zero","name":"Omni Zero","created_by":"fal","source":"official","description":"Any pose, any style, any identity","status":"active","release_date":"2024-04-25","model_type":"image","page_url":"https://fal.run/fal-ai/omni-zero","tagline":"Any pose, any style, any identity","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/omnigen-v1","name":"OmniGen v1","created_by":"fal","source":"official","description":"OmniGen is a unified image generation model that can generate a wide range of images from multi-modal prompts.","status":"active","release_date":"2024-11-29","model_type":"image","page_url":"https://fal.run/fal-ai/omnigen-v1","tagline":"OmniGen is a unified image generation model that can generate a wide range of images from multi-modal prompts.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/omnigen-v2","name":"Omnigen V2","created_by":"fal","source":"official","description":"OmniGen is a unified image generation model that can generate a wide range of images from multi-modal prompts.","status":"active","release_date":"2025-06-25","model_type":"image","page_url":"https://fal.run/fal-ai/omnigen-v2","tagline":"OmniGen is a unified image generation model that can 
generate a wide range of images from multi-modal prompts.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/omnilottie/image-to-lottie","name":"Omnilottie","created_by":"fal","source":"official","description":"Convert your assets into lottie using Omnilottie.","status":"active","release_date":"2026-03-11","model_type":"other","page_url":"https://fal.run/fal-ai/omnilottie/image-to-lottie","tagline":"Convert your assets into lottie using Omnilottie.","capabilities":{"vision":true,"structured_output":true,"json_mode":true},"last_seen_at":"2026-03-17","last_updated":"2026-05-11"},{"id":"fal-ai/omnilottie/video-to-lottie","name":"Omnilottie","created_by":"fal","source":"official","description":"Convert your assets into lottie using Omnilottie.","status":"active","release_date":"2026-03-11","model_type":"other","page_url":"https://fal.run/fal-ai/omnilottie/video-to-lottie","tagline":"Convert your assets into lottie using Omnilottie.","capabilities":{"structured_output":true,"json_mode":true},"last_seen_at":"2026-03-17","last_updated":"2026-05-11"},{"id":"fal-ai/omnilottie","name":"Omnilottie","created_by":"fal","source":"official","description":"Convert your assets into lottie using Omnilottie.","status":"active","release_date":"2026-03-11","model_type":"other","page_url":"https://fal.run/fal-ai/omnilottie","tagline":"Convert your assets into lottie using Omnilottie.","capabilities":{"structured_output":true,"json_mode":true},"last_seen_at":"2026-03-17","last_updated":"2026-05-11"},{"id":"fal-ai/omnipart","name":"Omnipart","created_by":"fal","source":"official","description":"Image-to-3D endpoint for OmniPart, a part-aware 3D generator with semantic decoupling and structural cohesion.","status":"active","release_date":"2025-10-29","model_type":"other","page_url":"https://fal.run/fal-ai/omnipart","tagline":"Image-to-3D endpoint for OmniPart, a 
part-aware 3D generator with semantic decoupling and structural cohesion.","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/one-to-all-animation/1.3b","name":"One To All Animation","created_by":"fal","source":"official","description":"One-to-All Animation is a pose driven video model that animates characters from a single reference image, enabling flexible, alignment-free motion transfer across diverse styles and scenes","status":"active","release_date":"2025-12-11","model_type":"other","page_url":"https://fal.run/fal-ai/one-to-all-animation/1.3b","tagline":"One-to-All Animation is a pose driven video model that animates characters from a single reference image, enabling flexible, alignment-free motion transfer across diverse styles and scenes","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/one-to-all-animation/14b","name":"One To All Animation","created_by":"fal","source":"official","description":"One-to-All Animation is a pose driven video model that animates characters from a single reference image, enabling flexible, alignment-free motion transfer across diverse styles and scenes","status":"active","release_date":"2025-12-11","model_type":"other","page_url":"https://fal.run/fal-ai/one-to-all-animation/14b","tagline":"One-to-All Animation is a pose driven video model that animates characters from a single reference image, enabling flexible, alignment-free motion transfer across diverse styles and scenes","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/onereward","name":"Onereward","created_by":"fal","source":"official","description":"OneReward is a finetuned version of Flux 1.0 Fill with intelligent editing capabilities.","status":"active","release_date":"2026-03-05","model_type":"image","page_url":"https://fal.run/fal-ai/onereward","tagline":"OneReward is a finetuned version of Flux 1.0 Fill with 
intelligent editing capabilities.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-03-05","last_updated":"2026-05-11"},{"id":"fal-ai/orpheus-tts","name":"Orpheus TTS","created_by":"fal","source":"official","description":"Orpheus TTS is a state-of-the-art, Llama-based Speech-LLM designed for high-quality, empathetic text-to-speech generation.","status":"active","release_date":"2025-03-31","model_type":"tts","page_url":"https://fal.run/fal-ai/orpheus-tts","tagline":"Orpheus TTS is a state-of-the-art, Llama-based Speech-LLM designed for high-quality, empathetic text-to-speech generation.","modalities":{"input":["text"],"output":["audio"]},"endpoints":["audio_speech"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/ovi/image-to-video","name":"Ovi","created_by":"fal","source":"official","description":"Ovi can generate videos with audio from image and text inputs.","status":"active","release_date":"2025-10-03","model_type":"video","page_url":"https://fal.run/fal-ai/ovi/image-to-video","tagline":"Ovi can generate videos with audio from image and text inputs.","capabilities":{"vision":true},"modalities":{"input":["text","image","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/ovi","name":"Ovi Text to Video","created_by":"fal","source":"official","description":"A unified paradigm for audio-video generation","status":"active","release_date":"2025-10-03","model_type":"video","page_url":"https://fal.run/fal-ai/ovi","tagline":"A unified paradigm for audio-video generation","modalities":{"input":["text","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/ovis-image","name":"Ovis Image","created_by":"fal","source":"official","description":"Ovis-Image is a 7B text-to-image model specifically optimized for quick, high quality text 
rendering.","status":"active","release_date":"2025-11-29","model_type":"image","page_url":"https://fal.run/fal-ai/ovis-image","tagline":"Ovis-Image is a 7B text-to-image model specifically optimized for quick, high quality text rendering.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/pasd","name":"PASD","created_by":"fal","source":"official","description":"Pixel-Aware Diffusion Model for Realistic Image Super-Resolution and Personalized Stylization","status":"active","release_date":"2025-06-17","model_type":"image","page_url":"https://fal.run/fal-ai/pasd","tagline":"Pixel-Aware Diffusion Model for Realistic Image Super-Resolution and Personalized Stylization","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/patina/material/extract","name":"PATINA","created_by":"fal","source":"official","description":"Extract seamless tiling textures with PBR attribute maps from images","status":"active","release_date":"2026-04-08","model_type":"image","page_url":"https://fal.run/fal-ai/patina/material/extract","tagline":"Extract seamless tiling textures with PBR attribute maps from images","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/patina/material","name":"PATINA","created_by":"fal","source":"official","description":"Generate complete seamlessly tiling PBR materials including normal, roughness, basecolor, height and metalness maps up to 8K","status":"active","release_date":"2026-04-08","model_type":"image","page_url":"https://fal.run/fal-ai/patina/material","tagline":"Generate complete seamlessly tiling PBR materials including normal, roughness, basecolor, height and metalness maps 
up to 8K","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/patina","name":"PATINA","created_by":"fal","source":"official","description":"PATINA creates seamless high-resolution normal, roughness, basecolor (albedo), height (displacement) and metalness maps from images","status":"active","release_date":"2026-04-08","model_type":"image","page_url":"https://fal.run/fal-ai/patina","tagline":"PATINA creates seamless high-resolution normal, roughness, basecolor (albedo), height (displacement) and metalness maps from images","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/personaplex/realtime","name":"Personaplex","created_by":"fal","source":"official","description":"PersonaPlex is a real-time, full-duplex speech-to-speech conversational model that enables persona control through text-based role prompts and audio-based voice conditioning.","status":"active","release_date":"2026-02-20","model_type":"other","page_url":"https://fal.run/fal-ai/personaplex/realtime","tagline":"PersonaPlex is a real-time, full-duplex speech-to-speech conversational model that enables persona control through text-based role prompts and audio-based voice conditioning.","last_seen_at":"2026-06-15","last_updated":"2026-06-18"},{"id":"fal-ai/personaplex","name":"Personaplex","created_by":"fal","source":"official","description":"PersonaPlex is a real-time, full-duplex speech-to-speech conversational model that enables persona control through text-based role prompts and audio-based voice conditioning.","status":"active","release_date":"2026-02-12","model_type":"other","page_url":"https://fal.run/fal-ai/personaplex","tagline":"PersonaPlex is a real-time, full-duplex speech-to-speech conversational model that enables persona control through 
text-based role prompts and audio-based voice conditioning.","capabilities":{"streaming":true},"last_seen_at":"2026-06-15","last_updated":"2026-06-18"},{"id":"fal-ai/phota/create-profile","name":"Phota Create Profile","created_by":"fal","source":"official","description":"Generate profiles using 30-50 images of a subject with Phota.","status":"active","release_date":"2026-03-26","model_type":"other","page_url":"https://fal.run/fal-ai/phota/create-profile","tagline":"Generate profiles using 30-50 images of a subject with Phota.","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/phota/edit","name":"Phota","created_by":"fal","source":"official","description":"Phota's model enables personalized photo editing, preserving identity while erasing distractions seamlessly.","status":"active","release_date":"2026-03-26","model_type":"image","page_url":"https://fal.run/fal-ai/phota/edit","tagline":"Phota's model enables personalized photo editing, preserving identity while erasing distractions seamlessly.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-05-27","last_updated":"2026-06-03"},{"id":"fal-ai/phota/enhance","name":"Phota Enhance","created_by":"fal","source":"official","description":"Enhance images while preserving identities with Phota","status":"active","release_date":"2026-03-26","model_type":"image","page_url":"https://fal.run/fal-ai/phota/enhance","tagline":"Enhance images while preserving identities with Phota","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-05-27","last_updated":"2026-06-03"},{"id":"fal-ai/phota","name":"Phota Text to Image","created_by":"fal","source":"official","description":"Phota's model empowers developers, photographers, and creators with personalized photograph generation and 
editing.","status":"active","release_date":"2026-03-26","model_type":"image","page_url":"https://fal.run/fal-ai/phota","tagline":"Phota's model empowers developers, photographers, and creators with personalized photograph generation and editing.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-05-27","last_updated":"2026-06-03"},{"id":"fal-ai/photomaker","name":"PhotoMaker","created_by":"fal","source":"official","description":"Customizing Realistic Human Photos via Stacked ID Embedding","status":"active","release_date":"2024-03-08","model_type":"image","page_url":"https://fal.run/fal-ai/photomaker","tagline":"Customizing Realistic Human Photos via Stacked ID Embedding","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/physic-edit","name":"Physic Edit","created_by":"fal","source":"official","description":"Physics-aware image editing with PhysicEdit.","status":"active","release_date":"2026-03-12","model_type":"image","page_url":"https://fal.run/fal-ai/physic-edit","tagline":"Physics-aware image editing with PhysicEdit.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-03-12","last_updated":"2026-05-11"},{"id":"fal-ai/piflow","name":"Piflow","created_by":"fal","source":"official","description":"Use the faster speed of piflow to generate images with same quality to that of slower models.","status":"active","release_date":"2025-10-27","model_type":"image","page_url":"https://fal.run/fal-ai/piflow","tagline":"Use the faster speed of piflow to generate images with same quality to that of slower 
models.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/pika/v1.5/pikaffects","name":"Pika Effects (v1.5)","created_by":"fal","source":"official","description":"Pika Effects are AI-powered video effects designed to modify objects, characters, and environments in a fun, engaging, and visually compelling manner.","status":"active","release_date":"2025-03-14","model_type":"video","page_url":"https://fal.run/fal-ai/pika/v1.5/pikaffects","tagline":"Pika Effects are AI-powered video effects designed to modify objects, characters, and environments in a fun, engaging, and visually compelling manner.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/pika/v2/pikadditions","name":"Pikadditions (v2)","created_by":"fal","source":"official","description":"Pikadditions is a powerful video-to-video AI model that allows you to add anyone or anything to any video with seamless integration.","status":"active","release_date":"2025-03-14","model_type":"other","page_url":"https://fal.run/fal-ai/pika/v2/pikadditions","tagline":"Pikadditions is a powerful video-to-video AI model that allows you to add anyone or anything to any video with seamless integration.","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/pika/v2/turbo/image-to-video","name":"Pika Image to Video Turbo (v2)","created_by":"fal","source":"official","description":"Turbo is the model to use when you feel the need for speed.","status":"active","release_date":"2025-03-14","model_type":"video","page_url":"https://fal.run/fal-ai/pika/v2/turbo/image-to-video","tagline":"Turbo is the model to use when you feel the need for 
speed.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/pika/v2/turbo/text-to-video","name":"Pika Text to Video Turbo (v2)","created_by":"fal","source":"official","description":"Pika v2 Turbo creates videos from a text prompt with high quality output.","status":"active","release_date":"2025-03-14","model_type":"video","page_url":"https://fal.run/fal-ai/pika/v2/turbo/text-to-video","tagline":"Pika v2 Turbo creates videos from a text prompt with high quality output.","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/pika/v2.1/image-to-video","name":"Pika Image to Video (v2.1)","created_by":"fal","source":"official","description":"Turn photos into mind-blowing, dynamic videos.","status":"active","release_date":"2025-03-14","model_type":"video","page_url":"https://fal.run/fal-ai/pika/v2.1/image-to-video","tagline":"Turn photos into mind-blowing, dynamic videos.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/pika/v2.1/text-to-video","name":"Pika Text to Video (v2.1)","created_by":"fal","source":"official","description":"Start with a simple text input to create dynamic generations that defy expectations.","status":"active","release_date":"2025-03-14","model_type":"video","page_url":"https://fal.run/fal-ai/pika/v2.1/text-to-video","tagline":"Start with a simple text input to create dynamic generations that defy expectations.","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/pika/v2.2/image-to-video","name":"Pika Image to Video (v2.2)","created_by":"fal","source":"official","description":"Turn photos into mind-blowing, 
dynamic videos in up to 1080p.","status":"active","release_date":"2025-03-14","model_type":"video","page_url":"https://fal.run/fal-ai/pika/v2.2/image-to-video","tagline":"Turn photos into mind-blowing, dynamic videos in up to 1080p.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/pika/v2.2/pikaframes","name":"Pika","created_by":"fal","source":"official","description":"Discover ultimate control with Pikaframes key frame interpolation, a stunning image-to-video feature that allows you to upload up to 5 keyframes, customize their transition length and prompt, and see ","status":"active","release_date":"2025-11-07","model_type":"video","page_url":"https://fal.run/fal-ai/pika/v2.2/pikaframes","tagline":"Discover ultimate control with Pikaframes key frame interpolation, a stunning image-to-video feature that allows you to upload up to 5 keyframes, customize their transition length and prompt, and see ","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/pika/v2.2/pikascenes","name":"Pika Scenes (v2.2)","created_by":"fal","source":"official","description":"Pika Scenes v2.2 creates videos from a images with high quality output.","status":"active","release_date":"2025-03-14","model_type":"video","page_url":"https://fal.run/fal-ai/pika/v2.2/pikascenes","tagline":"Pika Scenes v2.2 creates videos from a images with high quality output.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/pika/v2.2/text-to-video","name":"Pika Text to Video (v2.2)","created_by":"fal","source":"official","description":"Start with a simple text input to create dynamic generations that defy expectations in 
up to 1080p.","status":"active","release_date":"2025-03-14","model_type":"video","page_url":"https://fal.run/fal-ai/pika/v2.2/text-to-video","tagline":"Start with a simple text input to create dynamic generations that defy expectations in up to 1080p.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/pixal3d","name":"Pixal3d","created_by":"fal","source":"official","description":"Pixal3D turns a single image into a high-fidelity 3D model with detailed geometry and realistic textures.","status":"active","release_date":"2026-05-13","model_type":"other","page_url":"https://fal.run/fal-ai/pixal3d","tagline":"Pixal3D turns a single image into a high-fidelity 3D model with detailed geometry and realistic textures.","capabilities":{"vision":true},"last_seen_at":"2026-05-22","last_updated":"2026-06-03"},{"id":"fal-ai/pixart-sigma","name":"PixArt-Σ","created_by":"fal","source":"official","description":"Weak-to-Strong Training of Diffusion Transformer for 4K Text-to-Image Generation","status":"active","release_date":"2024-08-01","model_type":"image","page_url":"https://fal.run/fal-ai/pixart-sigma","tagline":"Weak-to-Strong Training of Diffusion Transformer for 4K Text-to-Image Generation","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/pixverse/c1/image-to-video","name":"PixVerse C1 Image To Video","created_by":"fal","source":"official","description":"Animate images into cinematic videos with PixVerse C1, supporting 1080p resolution and native audio generation.","status":"active","release_date":"2026-04-08","model_type":"video","page_url":"https://fal.run/fal-ai/pixverse/c1/image-to-video","tagline":"Animate images into cinematic videos with PixVerse C1, supporting 1080p resolution and native audio 
generation.","capabilities":{"vision":true},"modalities":{"input":["text","image","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-17","last_updated":"2026-06-18"},{"id":"fal-ai/pixverse/c1/reference-to-video","name":"PixVerse C1 Reference To Video","created_by":"fal","source":"official","description":"Generate character-consistent videos from reference images using PixVerse C1, with subject and background references.","status":"active","release_date":"2026-04-08","model_type":"video","page_url":"https://fal.run/fal-ai/pixverse/c1/reference-to-video","tagline":"Generate character-consistent videos from reference images using PixVerse C1, with subject and background references.","capabilities":{"vision":true},"modalities":{"input":["text","image","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-17","last_updated":"2026-06-18"},{"id":"fal-ai/pixverse/c1/text-to-video","name":"PixVerse C1 Text To Video","created_by":"fal","source":"official","description":"Generate film-grade videos from text prompts with native audio, up to 1080p and 15 seconds, using PixVerse C1.","status":"active","release_date":"2026-04-08","model_type":"video","page_url":"https://fal.run/fal-ai/pixverse/c1/text-to-video","tagline":"Generate film-grade videos from text prompts with native audio, up to 1080p and 15 seconds, using PixVerse C1.","modalities":{"input":["text","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-17","last_updated":"2026-06-18"},{"id":"fal-ai/pixverse/c1/transition","name":"PixVerse C1 Transition","created_by":"fal","source":"official","description":"Create seamless cinematic transitions between two images with PixVerse C1, with native audio and up to 1080p.","status":"active","release_date":"2026-04-08","model_type":"video","page_url":"https://fal.run/fal-ai/pixverse/c1/transition","tagline":"Create seamless cinematic transitions between two images with PixVerse C1, with native audio and up to 
1080p.","capabilities":{"vision":true},"modalities":{"input":["text","image","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-17","last_updated":"2026-06-18"},{"id":"fal-ai/pixverse/extend/fast","name":"PixVerse Extend Fast","created_by":"fal","source":"official","description":"PixVerse Extend model is a video extending tool for your videos using with high-quality video extending techniques ","status":"active","release_date":"2025-06-30","model_type":"other","page_url":"https://fal.run/fal-ai/pixverse/extend/fast","tagline":"PixVerse Extend model is a video extending tool for your videos using with high-quality video extending techniques ","capabilities":{"tool_call":true},"tools":["function_calling"],"last_seen_at":"2026-06-17","last_updated":"2026-06-18"},{"id":"fal-ai/pixverse/extend","name":"PixVerse Extend","created_by":"fal","source":"official","description":"PixVerse Extend model is a video extending tool for your videos using with high-quality video extending techniques ","status":"active","release_date":"2025-06-30","model_type":"other","page_url":"https://fal.run/fal-ai/pixverse/extend","tagline":"PixVerse Extend model is a video extending tool for your videos using with high-quality video extending techniques ","capabilities":{"tool_call":true},"tools":["function_calling"],"last_seen_at":"2026-06-17","last_updated":"2026-06-18"},{"id":"fal-ai/pixverse/lipsync","name":"PixVerse Lipsync","created_by":"fal","source":"official","description":"Generate realistic lipsync animations from audio using advanced algorithms for high-quality synchronization with PixVerse Lipsync model","status":"active","release_date":"2025-06-30","model_type":"other","page_url":"https://fal.run/fal-ai/pixverse/lipsync","tagline":"Generate realistic lipsync animations from audio using advanced algorithms for high-quality synchronization with PixVerse Lipsync 
model","last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/pixverse/sound-effects","name":"PixVerse Sound Effects","created_by":"fal","source":"official","description":"Add immersive sound effects and background music to your videos using PixVerse sound effects generation","status":"active","release_date":"2025-07-07","model_type":"other","page_url":"https://fal.run/fal-ai/pixverse/sound-effects","tagline":"Add immersive sound effects and background music to your videos using PixVerse sound effects generation","last_seen_at":"2026-06-17","last_updated":"2026-06-18"},{"id":"fal-ai/pixverse/swap","name":"PixVerse Swap","created_by":"fal","source":"official","description":"Generate high quality video clips by swapping person, objects and background using Pixverse Swap.","status":"active","release_date":"2025-11-10","model_type":"video","page_url":"https://fal.run/fal-ai/pixverse/swap","tagline":"Generate high quality video clips by swapping person, objects and background using Pixverse Swap.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-17","last_updated":"2026-06-18"},{"id":"fal-ai/pixverse/v3.5/effects","name":"PixVerse V3.5 Effects","created_by":"fal","source":"official","description":"Generate high quality video clips with different effects using PixVerse v3.5","status":"active","release_date":"2025-04-01","model_type":"video","page_url":"https://fal.run/fal-ai/pixverse/v3.5/effects","tagline":"Generate high quality video clips with different effects using PixVerse v3.5","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-17","last_updated":"2026-06-18"},{"id":"fal-ai/pixverse/v3.5/image-to-video/fast","name":"PixVerse V3.5 Image To Video Fast","created_by":"fal","source":"official","description":"Generate high quality video clips from text and image prompts quickly using 
PixVerse v3.5 Fast","status":"active","release_date":"2025-01-29","model_type":"video","page_url":"https://fal.run/fal-ai/pixverse/v3.5/image-to-video/fast","tagline":"Generate high quality video clips from text and image prompts quickly using PixVerse v3.5 Fast","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-17","last_updated":"2026-06-18"},{"id":"fal-ai/pixverse/v3.5/image-to-video","name":"PixVerse V3.5 Image To Video","created_by":"fal","source":"official","description":"Generate high quality video clips from text and image prompts using PixVerse v3.5","status":"active","release_date":"2025-01-29","model_type":"video","page_url":"https://fal.run/fal-ai/pixverse/v3.5/image-to-video","tagline":"Generate high quality video clips from text and image prompts using PixVerse v3.5","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-17","last_updated":"2026-06-18"},{"id":"fal-ai/pixverse/v3.5/text-to-video/fast","name":"PixVerse V3.5 Text To Video Fast","created_by":"fal","source":"official","description":"Generate high quality video clips quickly from text prompts using PixVerse v3.5 Fast","status":"active","release_date":"2025-01-29","model_type":"video","page_url":"https://fal.run/fal-ai/pixverse/v3.5/text-to-video/fast","tagline":"Generate high quality video clips quickly from text prompts using PixVerse v3.5 Fast","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-17","last_updated":"2026-06-18"},{"id":"fal-ai/pixverse/v3.5/text-to-video","name":"PixVerse V3.5 Text To Video","created_by":"fal","source":"official","description":"Generate high quality video clips from text prompts using PixVerse v3.5","status":"active","release_date":"2025-01-29","model_type":"video","page_url":"https://fal.run/fal-ai/pixverse/v3.5/text-to-video","tagline":"Generate 
high quality video clips from text prompts using PixVerse v3.5","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-17","last_updated":"2026-06-18"},{"id":"fal-ai/pixverse/v3.5/transition","name":"PixVerse V3.5 Transition","created_by":"fal","source":"official","description":"Create seamless transition between images using PixVerse v3.5","status":"active","release_date":"2025-04-01","model_type":"video","page_url":"https://fal.run/fal-ai/pixverse/v3.5/transition","tagline":"Create seamless transition between images using PixVerse v3.5","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-17","last_updated":"2026-06-18"},{"id":"fal-ai/pixverse/v4/effects","name":"PixVerse V4 Effects","created_by":"fal","source":"official","description":"Generate high quality video clips with different effects using PixVerse v4","status":"active","release_date":"2025-04-23","model_type":"video","page_url":"https://fal.run/fal-ai/pixverse/v4/effects","tagline":"Generate high quality video clips with different effects using PixVerse v4","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-17","last_updated":"2026-06-18"},{"id":"fal-ai/pixverse/v4/image-to-video/fast","name":"PixVerse V4 Image To Video Fast","created_by":"fal","source":"official","description":"Generate fast high quality video clips from text and image prompts using PixVerse v4","status":"active","release_date":"2025-04-01","model_type":"video","page_url":"https://fal.run/fal-ai/pixverse/v4/image-to-video/fast","tagline":"Generate fast high quality video clips from text and image prompts using PixVerse 
v4","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-17","last_updated":"2026-06-18"},{"id":"fal-ai/pixverse/v4/image-to-video","name":"PixVerse V4 Image To Video","created_by":"fal","source":"official","description":"Generate high quality video clips from text and image prompts using PixVerse v4","status":"active","release_date":"2025-04-01","model_type":"video","page_url":"https://fal.run/fal-ai/pixverse/v4/image-to-video","tagline":"Generate high quality video clips from text and image prompts using PixVerse v4","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-17","last_updated":"2026-06-18"},{"id":"fal-ai/pixverse/v4/text-to-video/fast","name":"PixVerse V4 Text To Video Fast","created_by":"fal","source":"official","description":"Generate high quality and fast video clips from text and image prompts using PixVerse v4 fast","status":"active","release_date":"2025-04-01","model_type":"video","page_url":"https://fal.run/fal-ai/pixverse/v4/text-to-video/fast","tagline":"Generate high quality and fast video clips from text and image prompts using PixVerse v4 fast","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-17","last_updated":"2026-06-18"},{"id":"fal-ai/pixverse/v4/text-to-video","name":"PixVerse V4 Text To Video","created_by":"fal","source":"official","description":"Generate high quality video clips from text and image prompts using PixVerse v4","status":"active","release_date":"2025-04-01","model_type":"video","page_url":"https://fal.run/fal-ai/pixverse/v4/text-to-video","tagline":"Generate high quality video clips from text and image prompts using PixVerse 
v4","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-17","last_updated":"2026-06-18"},{"id":"fal-ai/pixverse/v4.5/effects","name":"PixVerse V4.5 Effects","created_by":"fal","source":"official","description":"Generate high quality video clips with different effects using PixVerse v4.5","status":"active","release_date":"2025-05-15","model_type":"video","page_url":"https://fal.run/fal-ai/pixverse/v4.5/effects","tagline":"Generate high quality video clips with different effects using PixVerse v4.5","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-17","last_updated":"2026-06-18"},{"id":"fal-ai/pixverse/v4.5/image-to-video/fast","name":"PixVerse V4.5 Image To Video Fast","created_by":"fal","source":"official","description":"Generate fast high quality video clips from text and image prompts using PixVerse v4.5","status":"active","release_date":"2025-05-15","model_type":"video","page_url":"https://fal.run/fal-ai/pixverse/v4.5/image-to-video/fast","tagline":"Generate fast high quality video clips from text and image prompts using PixVerse v4.5","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-17","last_updated":"2026-06-18"},{"id":"fal-ai/pixverse/v4.5/image-to-video","name":"PixVerse V4.5 Image To Video","created_by":"fal","source":"official","description":"Generate high quality video clips from text and image prompts using PixVerse v4.5","status":"active","release_date":"2025-05-15","model_type":"video","page_url":"https://fal.run/fal-ai/pixverse/v4.5/image-to-video","tagline":"Generate high quality video clips from text and image prompts using PixVerse 
v4.5","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-17","last_updated":"2026-06-18"},{"id":"fal-ai/pixverse/v4.5/text-to-video/fast","name":"PixVerse V4.5 Text To Video Fast","created_by":"fal","source":"official","description":"Generate high quality and fast video clips from text and image prompts using PixVerse v4.5 fast","status":"active","release_date":"2025-05-15","model_type":"video","page_url":"https://fal.run/fal-ai/pixverse/v4.5/text-to-video/fast","tagline":"Generate high quality and fast video clips from text and image prompts using PixVerse v4.5 fast","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-17","last_updated":"2026-06-18"},{"id":"fal-ai/pixverse/v4.5/text-to-video","name":"PixVerse V4.5 Text To Video","created_by":"fal","source":"official","description":"Generate high quality video clips from text and image prompts using PixVerse v4.5","status":"active","release_date":"2025-05-15","model_type":"video","page_url":"https://fal.run/fal-ai/pixverse/v4.5/text-to-video","tagline":"Generate high quality video clips from text and image prompts using PixVerse v4.5","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-17","last_updated":"2026-06-18"},{"id":"fal-ai/pixverse/v4.5/transition","name":"PixVerse V4.5 Transition","created_by":"fal","source":"official","description":"Create seamless transition between images using PixVerse v4.5","status":"active","release_date":"2025-05-15","model_type":"video","page_url":"https://fal.run/fal-ai/pixverse/v4.5/transition","tagline":"Create seamless transition between images using PixVerse 
v4.5","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-17","last_updated":"2026-06-18"},{"id":"fal-ai/pixverse/v5/effects","name":"PixVerse V5 Effects","created_by":"fal","source":"official","description":"Generate high quality video clips with different effects using PixVerse v5","status":"active","release_date":"2025-08-23","model_type":"video","page_url":"https://fal.run/fal-ai/pixverse/v5/effects","tagline":"Generate high quality video clips with different effects using PixVerse v5","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-17","last_updated":"2026-06-18"},{"id":"fal-ai/pixverse/v5/image-to-video","name":"PixVerse V5 Image To Video","created_by":"fal","source":"official","description":"Generate high quality video clips from text and image prompts using PixVerse v5","status":"active","release_date":"2025-08-23","model_type":"video","page_url":"https://fal.run/fal-ai/pixverse/v5/image-to-video","tagline":"Generate high quality video clips from text and image prompts using PixVerse v5","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/pixverse/v5/text-to-video","name":"PixVerse V5 Text To Video","created_by":"fal","source":"official","description":"Generate high quality video clips from text and image prompts using PixVerse v5","status":"active","release_date":"2025-08-23","model_type":"video","page_url":"https://fal.run/fal-ai/pixverse/v5/text-to-video","tagline":"Generate high quality video clips from text and image prompts using PixVerse v5","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-17","last_updated":"2026-06-18"},{"id":"fal-ai/pixverse/v5/transition","name":"PixVerse 
V5 Transition","created_by":"fal","source":"official","description":"Create seamless transition between images using PixVerse v5","status":"active","release_date":"2025-08-23","model_type":"video","page_url":"https://fal.run/fal-ai/pixverse/v5/transition","tagline":"Create seamless transition between images using PixVerse v5","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-17","last_updated":"2026-06-18"},{"id":"fal-ai/pixverse/v5.5/effects","name":"PixVerse V5.5 Effects","created_by":"fal","source":"official","description":"Pixverse Effects","status":"active","release_date":"2025-12-02","model_type":"video","page_url":"https://fal.run/fal-ai/pixverse/v5.5/effects","tagline":"Pixverse Effects","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/pixverse/v5.5/image-to-video","name":"PixVerse V5.5 Image To Video","created_by":"fal","source":"official","description":"Generate high quality video clips from text and image prompts using PixVerse v5.5","status":"active","release_date":"2025-12-01","model_type":"video","page_url":"https://fal.run/fal-ai/pixverse/v5.5/image-to-video","tagline":"Generate high quality video clips from text and image prompts using PixVerse v5.5","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/pixverse/v5.5/text-to-video","name":"PixVerse V5.5 Text To Video","created_by":"fal","source":"official","description":"Generate high quality video clips from text and image prompts using PixVerse v5.5","status":"active","release_date":"2025-12-01","model_type":"video","page_url":"https://fal.run/fal-ai/pixverse/v5.5/text-to-video","tagline":"Generate high quality video clips from text and image prompts 
using PixVerse v5.5","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/pixverse/v5.5/transition","name":"PixVerse V5.5 Transition","created_by":"fal","source":"official","description":"Pixverse Transition","status":"active","release_date":"2025-12-02","model_type":"video","page_url":"https://fal.run/fal-ai/pixverse/v5.5/transition","tagline":"Pixverse Transition","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/pixverse/v5.6/image-to-video","name":"PixVerse V5.6 Image To Video","created_by":"fal","source":"official","description":"Use the latest pixverse v5.6 model to turn your texts and images into amazing videos.","status":"active","release_date":"2026-01-26","model_type":"video","page_url":"https://fal.run/fal-ai/pixverse/v5.6/image-to-video","tagline":"Use the latest pixverse v5.6 model to turn your texts and images into amazing videos.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-17","last_updated":"2026-06-18"},{"id":"fal-ai/pixverse/v5.6/text-to-video","name":"PixVerse V5.6 Text To Video","created_by":"fal","source":"official","description":"Use the latest pixverse v5.6 model to turn your texts into amazing videos.","status":"active","release_date":"2026-01-26","model_type":"video","page_url":"https://fal.run/fal-ai/pixverse/v5.6/text-to-video","tagline":"Use the latest pixverse v5.6 model to turn your texts into amazing videos.","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-17","last_updated":"2026-06-18"},{"id":"fal-ai/pixverse/v5.6/transition","name":"PixVerse V5.6 Transition","created_by":"fal","source":"official","description":"Use the latest pixverse v5.6 
model to turn your texts and images into amazing videos.","status":"active","release_date":"2026-01-26","model_type":"video","page_url":"https://fal.run/fal-ai/pixverse/v5.6/transition","tagline":"Use the latest pixverse v5.6 model to turn your texts and images into amazing videos.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/pixverse/v6/extend","name":"PixVerse V6 Extend","created_by":"fal","source":"official","description":"Pixverse's latest v6 Model.","status":"active","release_date":"2026-03-29","model_type":"other","page_url":"https://fal.run/fal-ai/pixverse/v6/extend","tagline":"Pixverse's latest v6 Model.","last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/pixverse/v6/image-to-video","name":"PixVerse V6 Image To Video","created_by":"fal","source":"official","description":"Pixverse's latest V6 Model","status":"active","release_date":"2026-03-29","model_type":"video","page_url":"https://fal.run/fal-ai/pixverse/v6/image-to-video","tagline":"Pixverse's latest V6 Model","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-17","last_updated":"2026-06-18"},{"id":"fal-ai/pixverse/v6/text-to-video","name":"PixVerse V6 Text To Video","created_by":"fal","source":"official","description":"Pixverse's latest v6 Model.","status":"active","release_date":"2026-03-29","model_type":"video","page_url":"https://fal.run/fal-ai/pixverse/v6/text-to-video","tagline":"Pixverse's latest v6 Model.","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-17","last_updated":"2026-06-18"},{"id":"fal-ai/pixverse/v6/transition","name":"PixVerse V6 Transition","created_by":"fal","source":"official","description":"Pixverse's latest v6 
Model.","status":"active","release_date":"2026-03-29","model_type":"video","page_url":"https://fal.run/fal-ai/pixverse/v6/transition","tagline":"Pixverse's latest v6 Model.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/playground-v25/image-to-image","name":"Playground v2.5","created_by":"fal","source":"official","description":"State-of-the-art open-source model in aesthetic quality","status":"active","release_date":"2024-02-21","model_type":"image","page_url":"https://fal.run/fal-ai/playground-v25/image-to-image","tagline":"State-of-the-art open-source model in aesthetic quality","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/playground-v25/inpainting","name":"Playground v2.5","created_by":"fal","source":"official","description":"State-of-the-art open-source model in aesthetic quality","status":"active","release_date":"2024-02-21","model_type":"image","page_url":"https://fal.run/fal-ai/playground-v25/inpainting","tagline":"State-of-the-art open-source model in aesthetic quality","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/playground-v25","name":"Playground v2.5","created_by":"fal","source":"official","description":"State-of-the-art open-source model in aesthetic quality","status":"active","release_date":"2024-04-25","model_type":"image","page_url":"https://fal.run/fal-ai/playground-v25","tagline":"State-of-the-art open-source model in aesthetic 
quality","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/plushify","name":"Plushify","created_by":"fal","source":"official","description":"Turn any image into a cute plushie!","status":"active","release_date":"2025-04-20","model_type":"image","page_url":"https://fal.run/fal-ai/plushify","tagline":"Turn any image into a cute plushie!","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/pony-v7","name":"Pony V7","created_by":"fal","source":"official","description":"Pony V7 is a finetuned text to image for superior aesthetics and prompt following.","status":"active","release_date":"2025-05-05","model_type":"image","page_url":"https://fal.run/fal-ai/pony-v7","tagline":"Pony V7 is a finetuned text to image for superior aesthetics and prompt following.","capabilities":{"streaming":true,"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/post-processing/blur","name":"Post Processing Blur","created_by":"fal","source":"official","description":"Apply Gaussian or Kuwahara blur effects with adjustable radius and sigma parameters","status":"active","release_date":"2025-07-01","model_type":"image","page_url":"https://fal.run/fal-ai/post-processing/blur","tagline":"Apply Gaussian or Kuwahara blur effects with adjustable radius and sigma parameters","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/post-processing/chromatic-aberration","name":"Post Processing Chromatic Aberration","created_by":"fal","source":"official","description":"Create chromatic aberration by shifting red, green, and 
blue channels horizontally or vertically with customizable shift amounts.","status":"active","release_date":"2025-07-01","model_type":"image","page_url":"https://fal.run/fal-ai/post-processing/chromatic-aberration","tagline":"Create chromatic aberration by shifting red, green, and blue channels horizontally or vertically with customizable shift amounts.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/post-processing/color-correction","name":"Post Processing Color Correction","created_by":"fal","source":"official","description":"Adjust color temperature, brightness, contrast, saturation, and gamma values for color correction.","status":"active","release_date":"2025-07-01","model_type":"image","page_url":"https://fal.run/fal-ai/post-processing/color-correction","tagline":"Adjust color temperature, brightness, contrast, saturation, and gamma values for color correction.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/post-processing/color-tint","name":"Post Processing Color Tint","created_by":"fal","source":"official","description":"Apply various color tints (sepia, red, green, blue, cyan, magenta, yellow, purple, orange, warm, cool, lime, navy, vintage, rose, teal, maroon, peach, lavender, olive) with adjustable strength.","status":"active","release_date":"2025-07-01","model_type":"image","page_url":"https://fal.run/fal-ai/post-processing/color-tint","tagline":"Apply various color tints (sepia, red, green, blue, cyan, magenta, yellow, purple, orange, warm, cool, lime, navy, vintage, rose, teal, maroon, peach, lavender, olive) with adjustable 
strength.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/post-processing/desaturate","name":"Post Processing Desaturate","created_by":"fal","source":"official","description":"Reduce color saturation using different methods (luminance Rec.709, luminance Rec.601, average, lightness) with adjustable factor.","status":"active","release_date":"2025-07-01","model_type":"image","page_url":"https://fal.run/fal-ai/post-processing/desaturate","tagline":"Reduce color saturation using different methods (luminance Rec.709, luminance Rec.601, average, lightness) with adjustable factor.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/post-processing/dissolve","name":"Post Processing Dissolve","created_by":"fal","source":"official","description":"Blend two images together using smooth linear interpolation with a configurable blend factor.","status":"active","release_date":"2025-07-01","model_type":"image","page_url":"https://fal.run/fal-ai/post-processing/dissolve","tagline":"Blend two images together using smooth linear interpolation with a configurable blend factor.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/post-processing/dodge-burn","name":"Post Processing Dodge Burn","created_by":"fal","source":"official","description":"Apply dodge and burn effects with multiple modes and adjustable intensity.","status":"active","release_date":"2025-07-01","model_type":"image","page_url":"https://fal.run/fal-ai/post-processing/dodge-burn","tagline":"Apply dodge and burn effects with multiple modes and adjustable 
intensity.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/post-processing/grain","name":"Post Processing Grain","created_by":"fal","source":"official","description":"Apply film grain effect with different styles (modern, analog, kodak, fuji, cinematic, newspaper) and customizable intensity and scale","status":"active","release_date":"2025-07-01","model_type":"image","page_url":"https://fal.run/fal-ai/post-processing/grain","tagline":"Apply film grain effect with different styles (modern, analog, kodak, fuji, cinematic, newspaper) and customizable intensity and scale","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/post-processing/parabolize","name":"Post Processing Parabolize","created_by":"fal","source":"official","description":"Apply a parabolic distortion effect with configurable coefficient and vertex position.","status":"active","release_date":"2025-07-01","model_type":"image","page_url":"https://fal.run/fal-ai/post-processing/parabolize","tagline":"Apply a parabolic distortion effect with configurable coefficient and vertex position.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/post-processing/sharpen","name":"Post Processing Sharpen","created_by":"fal","source":"official","description":"Apply sharpening effects with three modes: basic unsharp mask, smart sharpening with edge preservation, and Contrast Adaptive Sharpening (CAS).","status":"active","release_date":"2025-07-01","model_type":"image","page_url":"https://fal.run/fal-ai/post-processing/sharpen","tagline":"Apply sharpening effects with three modes: basic unsharp mask, smart sharpening with edge 
preservation, and Contrast Adaptive Sharpening (CAS).","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/post-processing/solarize","name":"Post Processing Solarize","created_by":"fal","source":"official","description":"Apply solarization effect by inverting pixel values above a threshold","status":"active","release_date":"2025-07-01","model_type":"image","page_url":"https://fal.run/fal-ai/post-processing/solarize","tagline":"Apply solarization effect by inverting pixel values above a threshold","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/post-processing/vignette","name":"Post Processing Vignette","created_by":"fal","source":"official","description":"Add a darkening vignette effect around the edges of the image with adjustable strength","status":"active","release_date":"2025-07-01","model_type":"image","page_url":"https://fal.run/fal-ai/post-processing/vignette","tagline":"Add a darkening vignette effect around the edges of the image with adjustable strength","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/post-processing","name":"Post Processing","created_by":"fal","source":"official","description":"Post Processing is an endpoint that can enhance images using a variety of techniques including grain, blur, sharpen, and more.","status":"active","release_date":"2025-02-18","model_type":"image","page_url":"https://fal.run/fal-ai/post-processing","tagline":"Post Processing is an endpoint that can enhance images using a variety of techniques including grain, blur, sharpen, and 
more.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/pshuman","name":"Pshuman","created_by":"fal","source":"official","description":"Use the 6D pose estimation capabilities of PSHuman to generate 3D files from single image.","status":"active","release_date":"2025-09-13","model_type":"other","page_url":"https://fal.run/fal-ai/pshuman","tagline":"Use the 6D pose estimation capabilities of PSHuman to generate 3D files from single image.","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/pulid","name":"PuLID","created_by":"fal","source":"official","description":"Tuning-free ID customization.","status":"active","release_date":"2023-12-14","model_type":"image","page_url":"https://fal.run/fal-ai/pulid","tagline":"Tuning-free ID customization.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/qwen-3-guard","name":"Qwen 3 Guard [8B]","created_by":"fal","source":"official","family":"qwen","description":"Use Qwen 3 Guard [8B] to detect and classify text as safe or harmful, delivering precise and reliable safety categorization.","status":"active","release_date":"2025-10-20","model_type":"other","page_url":"https://fal.run/fal-ai/qwen-3-guard","tagline":"Use Qwen 3 Guard [8B] to detect and classify text as safe or harmful, delivering precise and reliable safety categorization.","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/qwen-3-tts/clone-voice/0.6b","name":"Qwen 3 TTS - Clone Voice [0.6B]","created_by":"fal","source":"official","family":"qwen","description":"Clone your voices using Qwen3-TTS Clone-Voice model with zero shot cloning capabilities and use it on text-to-speech models to create speeches of 
yours!","status":"active","release_date":"2026-01-26","model_type":"other","page_url":"https://fal.run/fal-ai/qwen-3-tts/clone-voice/0.6b","tagline":"Clone your voices using Qwen3-TTS Clone-Voice model with zero shot cloning capabilities and use it on text-to-speech models to create speeches of yours!","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/qwen-3-tts/clone-voice/1.7b","name":"Qwen 3 TTS - Clone Voice [1.7B]","created_by":"fal","source":"official","family":"qwen","description":"Clone your voices using Qwen3-TTS Clone-Voice model with zero shot cloning capabilities and use it on text-to-speech models to create speeches of yours!","status":"active","release_date":"2026-01-26","model_type":"other","page_url":"https://fal.run/fal-ai/qwen-3-tts/clone-voice/1.7b","tagline":"Clone your voices using Qwen3-TTS Clone-Voice model with zero shot cloning capabilities and use it on text-to-speech models to create speeches of yours!","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/qwen-3-tts/text-to-speech/0.6b","name":"Qwen 3 TTS - Text to Speech [0.6B]","created_by":"fal","source":"official","family":"qwen","description":"Bring speech to your texts using Qwen3-TTS Custom-Voice model with pre-trained voices or use your custom voice with Qwen3-TTS Clone Voice model","status":"active","release_date":"2026-01-26","model_type":"tts","page_url":"https://fal.run/fal-ai/qwen-3-tts/text-to-speech/0.6b","tagline":"Bring speech to your texts using Qwen3-TTS Custom-Voice model with pre-trained voices or use your custom voice with Qwen3-TTS Clone Voice model","modalities":{"input":["text"],"output":["audio"]},"endpoints":["audio_speech"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/qwen-3-tts/text-to-speech/1.7b","name":"Qwen 3 TTS - Text to Speech [1.7B]","created_by":"fal","source":"official","family":"qwen","description":"Bring speech to your texts using Qwen3-TTS Custom-Voice model with pre-trained voices 
or use your custom voice with Qwen3-TTS Clone Voice model","status":"active","release_date":"2026-01-26","model_type":"tts","page_url":"https://fal.run/fal-ai/qwen-3-tts/text-to-speech/1.7b","tagline":"Bring speech to your texts using Qwen3-TTS Custom-Voice model with pre-trained voices or use your custom voice with Qwen3-TTS Clone Voice model","modalities":{"input":["text"],"output":["audio"]},"endpoints":["audio_speech"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/qwen-3-tts/voice-design/1.7b","name":"Qwen 3 TTS - Voice Design [1.7B]","created_by":"fal","source":"official","family":"qwen","description":"Create custom voices using Qwen3-TTS Voice Design model and later use Clone Voice model to create your own voices!","status":"active","release_date":"2026-01-26","model_type":"tts","page_url":"https://fal.run/fal-ai/qwen-3-tts/voice-design/1.7b","tagline":"Create custom voices using Qwen3-TTS Voice Design model and later use Clone Voice model to create your own voices!","modalities":{"input":["text"],"output":["audio"]},"endpoints":["audio_speech"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/qwen-image-2/edit","name":"Qwen Image 2","created_by":"fal","source":"official","family":"qwen","description":"Qwen-Image-2.0 is a next-generation foundational unified generation-and-editing model","status":"active","release_date":"2026-03-03","model_type":"image","page_url":"https://fal.run/fal-ai/qwen-image-2/edit","tagline":"Qwen-Image-2.0 is a next-generation foundational unified generation-and-editing model","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-05-07","last_updated":"2026-05-11"},{"id":"fal-ai/qwen-image-2/pro/edit","name":"Qwen Image 2","created_by":"fal","source":"official","family":"qwen","description":"Qwen-Image-2.0 is a next-generation foundational unified generation-and-editing 
model","status":"active","release_date":"2026-03-03","model_type":"image","page_url":"https://fal.run/fal-ai/qwen-image-2/pro/edit","tagline":"Qwen-Image-2.0 is a next-generation foundational unified generation-and-editing model","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-05-07","last_updated":"2026-05-11"},{"id":"fal-ai/qwen-image-2/pro/text-to-image","name":"Qwen Image 2","created_by":"fal","source":"official","family":"qwen","description":"Qwen-Image-2.0 is a next-generation foundational unified generation-and-editing model","status":"active","release_date":"2026-03-03","model_type":"image","page_url":"https://fal.run/fal-ai/qwen-image-2/pro/text-to-image","tagline":"Qwen-Image-2.0 is a next-generation foundational unified generation-and-editing model","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-05-07","last_updated":"2026-05-11"},{"id":"fal-ai/qwen-image-2/text-to-image","name":"Qwen Image 2","created_by":"fal","source":"official","family":"qwen","description":"Qwen-Image-2.0 is a next-generation foundational unified generation-and-editing model","status":"active","release_date":"2026-03-03","model_type":"image","page_url":"https://fal.run/fal-ai/qwen-image-2/text-to-image","tagline":"Qwen-Image-2.0 is a next-generation foundational unified generation-and-editing model","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-05-07","last_updated":"2026-05-11"},{"id":"fal-ai/qwen-image-2512/lora","name":"Qwen Image 2512","created_by":"fal","source":"official","family":"qwen","description":"LoRA inference endpoint for Qwen Image 2512, an improved version of Qwen Image with better text rendering, finer natural textures, and more realistic human 
generation.","status":"active","release_date":"2026-01-02","model_type":"image","page_url":"https://fal.run/fal-ai/qwen-image-2512/lora","tagline":"LoRA inference endpoint for Qwen Image 2512, an improved version of Qwen Image with better text rendering, finer natural textures, and more realistic human generation.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/qwen-image-2512-trainer-v2","name":"Qwen Image 2512 Trainer V2","created_by":"fal","source":"official","family":"qwen","description":"Fast LoRA trainer for Qwen-Image-2512","status":"active","release_date":"2026-01-15","model_type":"other","page_url":"https://fal.run/fal-ai/qwen-image-2512-trainer-v2","tagline":"Fast LoRA trainer for Qwen-Image-2512","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/qwen-image-2512-trainer","name":"Qwen Image 2512 Trainer","created_by":"fal","source":"official","family":"qwen","description":"Qwen Image 2512 LoRA training","status":"active","release_date":"2026-01-01","model_type":"other","page_url":"https://fal.run/fal-ai/qwen-image-2512-trainer","tagline":"Qwen Image 2512 LoRA training","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/qwen-image-2512","name":"Qwen Image 2512","created_by":"fal","source":"official","family":"qwen","description":"Qwen Image 2512 is an improved version of Qwen Image with better text rendering, finer natural textures, and more realistic human generation.","status":"active","release_date":"2025-12-30","model_type":"image","page_url":"https://fal.run/fal-ai/qwen-image-2512","tagline":"Qwen Image 2512 is an improved version of Qwen Image with better text rendering, finer natural textures, and more realistic human 
generation.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/qwen-image-edit-2509-lora-gallery/add-background","name":"Qwen Image Edit 2509 Lora Gallery","created_by":"fal","source":"official","family":"qwen","description":"Add a realistic scene behind the object with white background","status":"active","release_date":"2025-12-15","model_type":"image","page_url":"https://fal.run/fal-ai/qwen-image-edit-2509-lora-gallery/add-background","tagline":"Add a realistic scene behind the object with white background","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/qwen-image-edit-2509-lora-gallery/face-to-full-portrait","name":"Qwen Image Edit 2509 Lora Gallery","created_by":"fal","source":"official","family":"qwen","description":"Generate full portrait from a cropped face photo","status":"active","release_date":"2025-12-15","model_type":"image","page_url":"https://fal.run/fal-ai/qwen-image-edit-2509-lora-gallery/face-to-full-portrait","tagline":"Generate full portrait from a cropped face photo","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/qwen-image-edit-2509-lora-gallery/group-photo","name":"Qwen Image Edit 2509 Lora Gallery","created_by":"fal","source":"official","family":"qwen","description":"Create group photos ","status":"active","release_date":"2025-12-15","model_type":"image","page_url":"https://fal.run/fal-ai/qwen-image-edit-2509-lora-gallery/group-photo","tagline":"Create group photos 
","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/qwen-image-edit-2509-lora-gallery/integrate-product","name":"Qwen Image Edit 2509 Lora Gallery","created_by":"fal","source":"official","family":"qwen","description":"Blend products into backgrounds with automatic perspective and lighting correction","status":"active","release_date":"2025-12-15","model_type":"image","page_url":"https://fal.run/fal-ai/qwen-image-edit-2509-lora-gallery/integrate-product","tagline":"Blend products into backgrounds with automatic perspective and lighting correction","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/qwen-image-edit-2509-lora-gallery/lighting-restoration","name":"Qwen Image Edit 2509 Lora Gallery","created_by":"fal","source":"official","family":"qwen","description":"Removes harsh shadows and light spots from images, replacing them with soft, even, natural-looking illumination.","status":"active","release_date":"2025-12-15","model_type":"image","page_url":"https://fal.run/fal-ai/qwen-image-edit-2509-lora-gallery/lighting-restoration","tagline":"Removes harsh shadows and light spots from images, replacing them with soft, even, natural-looking illumination.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/qwen-image-edit-2509-lora-gallery/multiple-angles","name":"Qwen Image Edit 2509 Lora Gallery","created_by":"fal","source":"official","family":"qwen","description":"Precise camera position and angle control (rotation, zoom, vertical 
movement)","status":"active","release_date":"2025-12-15","model_type":"image","page_url":"https://fal.run/fal-ai/qwen-image-edit-2509-lora-gallery/multiple-angles","tagline":"Precise camera position and angle control (rotation, zoom, vertical movement)","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/qwen-image-edit-2509-lora-gallery/next-scene","name":"Qwen Image Edit 2509 Lora Gallery","created_by":"fal","source":"official","family":"qwen","description":"Create cinematic transitions and scene progressions (camera movements, framing changes)","status":"active","release_date":"2025-12-15","model_type":"image","page_url":"https://fal.run/fal-ai/qwen-image-edit-2509-lora-gallery/next-scene","tagline":"Create cinematic transitions and scene progressions (camera movements, framing changes)","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/qwen-image-edit-2509-lora-gallery/remove-element","name":"Qwen Image Edit 2509 Lora Gallery","created_by":"fal","source":"official","family":"qwen","description":"Remove unwanted elements (objects, people, text) while maintaining image consistency","status":"active","release_date":"2025-12-15","model_type":"image","page_url":"https://fal.run/fal-ai/qwen-image-edit-2509-lora-gallery/remove-element","tagline":"Remove unwanted elements (objects, people, text) while maintaining image consistency","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/qwen-image-edit-2509-lora-gallery/remove-lighting","name":"Qwen Image Edit 2509 Lora Gallery","created_by":"fal","source":"official","family":"qwen","description":"Remove existing lighting and apply 
soft, even illumination","status":"active","release_date":"2025-12-15","model_type":"image","page_url":"https://fal.run/fal-ai/qwen-image-edit-2509-lora-gallery/remove-lighting","tagline":"Remove existing lighting and apply soft, even illumination","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/qwen-image-edit-2509-lora-gallery/shirt-design","name":"Qwen Image Edit 2509 Lora Gallery","created_by":"fal","source":"official","family":"qwen","description":"Apply designs/graphics onto people's shirts","status":"active","release_date":"2025-12-15","model_type":"image","page_url":"https://fal.run/fal-ai/qwen-image-edit-2509-lora-gallery/shirt-design","tagline":"Apply designs/graphics onto people's shirts","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/qwen-image-edit-2509-lora","name":"Qwen Image Edit 2509 Lora","created_by":"fal","source":"official","family":"qwen","description":"LoRA endpoint for the Qwen Image Edit 2509 model.","status":"active","release_date":"2025-12-15","model_type":"image","page_url":"https://fal.run/fal-ai/qwen-image-edit-2509-lora","tagline":"LoRA endpoint for the Qwen Image Edit 2509 model.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/qwen-image-edit-2509-trainer","name":"Qwen Image Edit 2509 Trainer","created_by":"fal","source":"official","family":"qwen","description":"LoRA trainer for Qwen Image Edit 2509","status":"active","release_date":"2025-12-15","model_type":"other","page_url":"https://fal.run/fal-ai/qwen-image-edit-2509-trainer","tagline":"LoRA trainer for Qwen Image Edit 
2509","capabilities":{"vision":true},"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/qwen-image-edit-2509","name":"Qwen Image Edit 2509","created_by":"fal","source":"official","family":"qwen","description":"Endpoint for Qwen's Image Editing Plus model also known as Qwen-Image-Edit-2509.","status":"active","release_date":"2025-12-15","model_type":"image","page_url":"https://fal.run/fal-ai/qwen-image-edit-2509","tagline":"Endpoint for Qwen's Image Editing Plus model also known as Qwen-Image-Edit-2509.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/qwen-image-edit-2511/lora","name":"Qwen Image Edit 2511","created_by":"fal","source":"official","family":"qwen","description":"Endpoint for Qwen's Image Editing 2511 model with LoRa support.","status":"active","release_date":"2025-12-30","model_type":"image","page_url":"https://fal.run/fal-ai/qwen-image-edit-2511/lora","tagline":"Endpoint for Qwen's Image Editing 2511 model with LoRa support.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/qwen-image-edit-2511-multiple-angles","name":"Qwen Image Edit 2511 Multiple Angles","created_by":"fal","source":"official","family":"qwen","description":"Generates same scene from different angles (azimuth/elevation) with Qwen image Edit 2511 and the Lora Multiple Angles","status":"active","release_date":"2026-01-07","model_type":"image","page_url":"https://fal.run/fal-ai/qwen-image-edit-2511-multiple-angles","tagline":"Generates same scene from different angles (azimuth/elevation) with Qwen image Edit 2511 and the Lora Multiple 
Angles","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/qwen-image-edit-2511-trainer","name":"Qwen Image Edit 2511 Trainer","created_by":"fal","source":"official","family":"qwen","description":"LoRA trainer for Qwen Image Edit 2511","status":"active","release_date":"2025-12-23","model_type":"other","page_url":"https://fal.run/fal-ai/qwen-image-edit-2511-trainer","tagline":"LoRA trainer for Qwen Image Edit 2511","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/qwen-image-edit-2511","name":"Qwen Image Edit 2511","created_by":"fal","source":"official","family":"qwen","description":"Endpoint for Qwen's Image Editing 2511 model.","status":"active","release_date":"2025-12-19","model_type":"image","page_url":"https://fal.run/fal-ai/qwen-image-edit-2511","tagline":"Endpoint for Qwen's Image Editing 2511 model.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/qwen-image-edit/image-to-image","name":"Qwen Image Edit","created_by":"fal","source":"official","family":"qwen","description":"Image to Image Endpoint for Qwen's Image Editing model.","status":"active","release_date":"2025-09-30","model_type":"image","page_url":"https://fal.run/fal-ai/qwen-image-edit/image-to-image","tagline":"Image to Image Endpoint for Qwen's Image Editing model.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/qwen-image-edit/inpaint","name":"Qwen Image Edit","created_by":"fal","source":"official","family":"qwen","description":"Inpainting Endpoint for the Qwen Edit Image editing 
model.","status":"active","release_date":"2025-09-17","model_type":"image","page_url":"https://fal.run/fal-ai/qwen-image-edit/inpaint","tagline":"Inpainting Endpoint for the Qwen Edit Image editing model.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/qwen-image-edit-lora","name":"Qwen Image Edit Lora","created_by":"fal","source":"official","family":"qwen","description":"LoRA inference endpoint for the Qwen Image Editing model.","status":"active","release_date":"2025-09-10","model_type":"image","page_url":"https://fal.run/fal-ai/qwen-image-edit-lora","tagline":"LoRA inference endpoint for the Qwen Image Editing model.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/qwen-image-edit-plus-lora-gallery/add-background","name":"Qwen Image Edit Plus Lora Gallery","created_by":"fal","source":"official","family":"qwen","description":"Add a realistic scene behind the object with white background","status":"active","release_date":"2025-11-11","model_type":"image","page_url":"https://fal.run/fal-ai/qwen-image-edit-plus-lora-gallery/add-background","tagline":"Add a realistic scene behind the object with white background","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/qwen-image-edit-plus-lora-gallery/face-to-full-portrait","name":"Qwen Image Edit Plus Lora Gallery","created_by":"fal","source":"official","family":"qwen","description":"Generate full portrait from a cropped face photo","status":"active","release_date":"2025-11-11","model_type":"image","page_url":"https://fal.run/fal-ai/qwen-image-edit-plus-lora-gallery/face-to-full-portrait","tagline":"Generate full portrait 
from a cropped face photo","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/qwen-image-edit-plus-lora-gallery/group-photo","name":"Qwen Image Edit Plus Lora Gallery","created_by":"fal","source":"official","family":"qwen","description":"Create group photos ","status":"active","release_date":"2025-11-11","model_type":"image","page_url":"https://fal.run/fal-ai/qwen-image-edit-plus-lora-gallery/group-photo","tagline":"Create group photos ","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/qwen-image-edit-plus-lora-gallery/integrate-product","name":"Qwen Image Edit Plus Lora Gallery","created_by":"fal","source":"official","family":"qwen","description":"Blend products into backgrounds with automatic perspective and lighting correction","status":"active","release_date":"2025-11-11","model_type":"image","page_url":"https://fal.run/fal-ai/qwen-image-edit-plus-lora-gallery/integrate-product","tagline":"Blend products into backgrounds with automatic perspective and lighting correction","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/qwen-image-edit-plus-lora-gallery/lighting-restoration","name":"Qwen Image Edit Plus Lora Gallery","created_by":"fal","source":"official","family":"qwen","description":"Removes harsh shadows and light spots from images, replacing them with soft, even, natural-looking illumination.","status":"active","release_date":"2025-12-12","model_type":"image","page_url":"https://fal.run/fal-ai/qwen-image-edit-plus-lora-gallery/lighting-restoration","tagline":"Removes harsh shadows and light spots from images, replacing them with soft, even, natural-looking 
illumination.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/qwen-image-edit-plus-lora-gallery/multiple-angles","name":"Qwen Image Edit Plus Lora Gallery","created_by":"fal","source":"official","family":"qwen","description":"Precise camera position and angle control (rotation, zoom, vertical movement)","status":"active","release_date":"2025-11-11","model_type":"image","page_url":"https://fal.run/fal-ai/qwen-image-edit-plus-lora-gallery/multiple-angles","tagline":"Precise camera position and angle control (rotation, zoom, vertical movement)","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/qwen-image-edit-plus-lora-gallery/next-scene","name":"Qwen Image Edit Plus Lora Gallery","created_by":"fal","source":"official","family":"qwen","description":"Create cinematic transitions and scene progressions (camera movements, framing changes)","status":"active","release_date":"2025-11-11","model_type":"image","page_url":"https://fal.run/fal-ai/qwen-image-edit-plus-lora-gallery/next-scene","tagline":"Create cinematic transitions and scene progressions (camera movements, framing changes)","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/qwen-image-edit-plus-lora-gallery/remove-element","name":"Qwen Image Edit Plus Lora Gallery","created_by":"fal","source":"official","family":"qwen","description":"Remove unwanted elements (objects, people, text) while maintaining image consistency","status":"active","release_date":"2025-11-11","model_type":"image","page_url":"https://fal.run/fal-ai/qwen-image-edit-plus-lora-gallery/remove-element","tagline":"Remove unwanted elements (objects, 
people, text) while maintaining image consistency","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/qwen-image-edit-plus-lora-gallery/remove-lighting","name":"Qwen Image Edit Plus Lora Gallery","created_by":"fal","source":"official","family":"qwen","description":"Remove existing lighting and apply soft, even illumination","status":"active","release_date":"2025-11-11","model_type":"image","page_url":"https://fal.run/fal-ai/qwen-image-edit-plus-lora-gallery/remove-lighting","tagline":"Remove existing lighting and apply soft, even illumination","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/qwen-image-edit-plus-lora-gallery/shirt-design","name":"Qwen Image Edit Plus Lora Gallery","created_by":"fal","source":"official","family":"qwen","description":"Apply designs/graphics onto people's shirts","status":"active","release_date":"2025-11-11","model_type":"image","page_url":"https://fal.run/fal-ai/qwen-image-edit-plus-lora-gallery/shirt-design","tagline":"Apply designs/graphics onto people's shirts","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/qwen-image-edit-plus-lora","name":"Qwen Image Edit Plus Lora","created_by":"fal","source":"official","family":"qwen","description":"LoRA endpoint for the Qwen Image Edit Plus model.","status":"active","release_date":"2025-10-03","model_type":"image","page_url":"https://fal.run/fal-ai/qwen-image-edit-plus-lora","tagline":"LoRA endpoint for the Qwen Image Edit Plus 
model.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/qwen-image-edit-plus-trainer","name":"Qwen Image Edit Plus Trainer","created_by":"fal","source":"official","family":"qwen","description":"LoRA trainer for Qwen Image Edit Plus","status":"active","release_date":"2025-10-30","model_type":"other","page_url":"https://fal.run/fal-ai/qwen-image-edit-plus-trainer","tagline":"LoRA trainer for Qwen Image Edit Plus","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/qwen-image-edit-plus","name":"Qwen Image Edit Plus","created_by":"fal","source":"official","family":"qwen","description":"Endpoint for Qwen's Image Editing Plus model also known as Qwen-Image-Edit-2509.","status":"active","release_date":"2025-09-22","model_type":"image","page_url":"https://fal.run/fal-ai/qwen-image-edit-plus","tagline":"Endpoint for Qwen's Image Editing Plus model also known as Qwen-Image-Edit-2509.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/qwen-image-edit-trainer","name":"Qwen Image Edit Trainer","created_by":"fal","source":"official","family":"qwen","description":"LoRA trainer for Qwen Image Edit","status":"active","release_date":"2025-10-30","model_type":"other","page_url":"https://fal.run/fal-ai/qwen-image-edit-trainer","tagline":"LoRA trainer for Qwen Image Edit","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/qwen-image-edit","name":"Qwen Image Edit","created_by":"fal","source":"official","family":"qwen","description":"Endpoint for Qwen's Image Editing model.","status":"active","release_date":"2025-08-18","model_type":"image","page_url":"https://fal.run/fal-ai/qwen-image-edit","tagline":"Endpoint for Qwen's 
Image Editing model.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/qwen-image/image-to-image","name":"Qwen Image","created_by":"fal","source":"official","family":"qwen","description":"Qwen-Image (Image-to-Image) transforms and edits input images with high fidelity, enabling precise style transfer, enhancement, and creative modification.","status":"active","release_date":"2025-08-25","model_type":"image","page_url":"https://fal.run/fal-ai/qwen-image/image-to-image","tagline":"Qwen-Image (Image-to-Image) transforms and edits input images with high fidelity, enabling precise style transfer, enhancement, and creative modification.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/qwen-image-layered/lora","name":"Qwen Image Layered","created_by":"fal","source":"official","family":"qwen","description":"Qwen-Image-Layered is a model capable of decomposing an image into multiple RGBA layers.","status":"active","release_date":"2025-12-24","model_type":"image","page_url":"https://fal.run/fal-ai/qwen-image-layered/lora","tagline":"Qwen-Image-Layered is a model capable of decomposing an image into multiple RGBA layers.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/qwen-image-layered-trainer","name":"Qwen Image Layered Trainer","created_by":"fal","source":"official","family":"qwen","description":"Train LoRAs for the Qwen-Image-Layered model, customize how images are split into layers.","status":"active","release_date":"2025-12-23","model_type":"other","page_url":"https://fal.run/fal-ai/qwen-image-layered-trainer","tagline":"Train LoRAs for the Qwen-Image-Layered model, 
customize how images are split into layers.","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/qwen-image-layered","name":"Qwen Image Layered","created_by":"fal","source":"official","family":"qwen","description":"Qwen-Image-Layered is a model capable of decomposing an image into multiple RGBA layers.","status":"active","release_date":"2025-12-19","model_type":"image","page_url":"https://fal.run/fal-ai/qwen-image-layered","tagline":"Qwen-Image-Layered is a model capable of decomposing an image into multiple RGBA layers.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/qwen-image-max/edit","name":"Qwen Image Max","created_by":"fal","source":"official","family":"qwen","description":"Image editing endpoint for Qwen-Image-Max.","status":"active","release_date":"2026-01-27","model_type":"image","page_url":"https://fal.run/fal-ai/qwen-image-max/edit","tagline":"Image editing endpoint for Qwen-Image-Max.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-05-07","last_updated":"2026-05-11"},{"id":"fal-ai/qwen-image-max/text-to-image","name":"Qwen Image Max","created_by":"fal","source":"official","family":"qwen","description":"Text-to-Image endpoint for Qwen-Image-Max.","status":"active","release_date":"2026-01-27","model_type":"image","page_url":"https://fal.run/fal-ai/qwen-image-max/text-to-image","tagline":"Text-to-Image endpoint for Qwen-Image-Max.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-05-07","last_updated":"2026-05-11"},{"id":"fal-ai/qwen-image-trainer-v2","name":"Qwen Image Trainer V2","created_by":"fal","source":"official","family":"qwen","description":"Qwen Image LoRA 
training","status":"active","release_date":"2026-02-06","model_type":"other","page_url":"https://fal.run/fal-ai/qwen-image-trainer-v2","tagline":"Qwen Image LoRA training","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/qwen-image-trainer","name":"Qwen Image Trainer","created_by":"fal","source":"official","family":"qwen","description":"Qwen Image LoRA training","status":"active","release_date":"2025-08-14","model_type":"other","page_url":"https://fal.run/fal-ai/qwen-image-trainer","tagline":"Qwen Image LoRA training","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/qwen-image","name":"Qwen Image","created_by":"fal","source":"official","family":"qwen","description":"Qwen-Image is an image generation foundation model in the Qwen series that achieves significant advances in complex text rendering and precise image editing.","status":"active","release_date":"2025-08-04","model_type":"image","page_url":"https://fal.run/fal-ai/qwen-image","tagline":"Qwen-Image is an image generation foundation model in the Qwen series that achieves significant advances in complex text rendering and precise image editing.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/realistic-vision","name":"Realistic Vision","created_by":"fal","source":"official","description":"Generate realistic images.","status":"active","release_date":"2024-04-25","model_type":"image","page_url":"https://fal.run/fal-ai/realistic-vision","tagline":"Generate realistic images.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/reconviagen-0.5","name":"ReconViaGen 0.5","created_by":"fal","source":"official","description":"Generate 3D models from one or more images 
using ReconViaGen 0.5","status":"active","release_date":"2026-04-07","model_type":"other","page_url":"https://fal.run/fal-ai/reconviagen-0.5","tagline":"Generate 3D models from one or more images using ReconViaGen 0.5","capabilities":{"vision":true},"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/recraft-20b","name":"Recraft 20b","created_by":"fal","source":"official","description":"Recraft 20b is a new and affordable text-to-image model.","status":"active","release_date":"2024-12-16","model_type":"image","parameters":20,"page_url":"https://fal.run/fal-ai/recraft-20b","tagline":"Recraft 20b is a new and affordable text-to-image model.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/recraft/upscale/creative","name":"Recraft Creative Upscale","created_by":"fal","source":"official","description":"Enhances a given raster image using the 'creative upscale' tool, increasing image resolution, making the image sharper and cleaner.","status":"active","release_date":"2025-05-07","model_type":"image","page_url":"https://fal.run/fal-ai/recraft/upscale/creative","tagline":"Enhances a given raster image using the 'creative upscale' tool, increasing image resolution, making the image sharper and cleaner.","capabilities":{"vision":true,"tool_call":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"tools":["function_calling"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/recraft/upscale/crisp","name":"Recraft Crisp Upscale","created_by":"fal","source":"official","description":"Enhances a given raster image using 'crisp upscale' tool, boosting resolution with a focus on refining small details and faces.","status":"active","release_date":"2025-05-07","model_type":"image","page_url":"https://fal.run/fal-ai/recraft/upscale/crisp","tagline":"Enhances a given raster image 
using 'crisp upscale' tool, boosting resolution with a focus on refining small details and faces.","capabilities":{"vision":true,"tool_call":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"tools":["function_calling"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/recraft/v3/create-style","name":"Recraft V3 Create Style","created_by":"fal","source":"official","description":"Recraft V3 Create Style is capable of creating unique styles for Recraft V3 based on your images.","status":"active","release_date":"2025-05-07","model_type":"other","page_url":"https://fal.run/fal-ai/recraft/v3/create-style","tagline":"Recraft V3 Create Style is capable of creating unique styles for Recraft V3 based on your images.","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/recraft/v3/image-to-image","name":"Recraft V3","created_by":"fal","source":"official","description":"Recraft V3 is a text-to-image model with the ability to generate long texts, vector art, images in brand style, and much more.","status":"active","release_date":"2025-05-07","model_type":"image","page_url":"https://fal.run/fal-ai/recraft/v3/image-to-image","tagline":"Recraft V3 is a text-to-image model with the ability to generate long texts, vector art, images in brand style, and much more.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/recraft/v3/text-to-image","name":"Recraft V3","created_by":"fal","source":"official","description":"Recraft V3 is a text-to-image model with the ability to generate long texts, vector art, images in brand style, and much more.","status":"active","release_date":"2025-05-07","model_type":"image","page_url":"https://fal.run/fal-ai/recraft/v3/text-to-image","tagline":"Recraft V3 is a text-to-image model with the ability to generate long 
texts, vector art, images in brand style, and much more.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/recraft/v4/pro/text-to-image","name":"Recraft V4 Pro","created_by":"fal","source":"official","description":"Recraft V4 was developed with designers to bring true visual taste to AI image generation.","status":"active","release_date":"2026-02-12","model_type":"image","page_url":"https://fal.run/fal-ai/recraft/v4/pro/text-to-image","tagline":"Recraft V4 was developed with designers to bring true visual taste to AI image generation.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/recraft/v4/pro/text-to-vector","name":"Recraft V4 Pro (Vector)","created_by":"fal","source":"official","description":"Recraft V4 was developed with designers to bring true visual taste to AI image generation.","status":"active","release_date":"2026-02-16","model_type":"image","page_url":"https://fal.run/fal-ai/recraft/v4/pro/text-to-vector","tagline":"Recraft V4 was developed with designers to bring true visual taste to AI image generation.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-03-03","last_updated":"2026-05-11"},{"id":"fal-ai/recraft/v4/text-to-image","name":"Recraft V4","created_by":"fal","source":"official","description":"Recraft V4 was developed with designers to bring true visual taste to AI image generation.","status":"active","release_date":"2026-02-12","model_type":"image","page_url":"https://fal.run/fal-ai/recraft/v4/text-to-image","tagline":"Recraft V4 was developed with designers to bring true visual taste to AI image 
generation.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/recraft/v4/text-to-vector","name":"Recraft V4 (Vector)","created_by":"fal","source":"official","description":"Recraft V4 was developed with designers to bring true visual taste to AI image generation.","status":"active","release_date":"2026-02-16","model_type":"image","page_url":"https://fal.run/fal-ai/recraft/v4/text-to-vector","tagline":"Recraft V4 was developed with designers to bring true visual taste to AI image generation.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-03-03","last_updated":"2026-05-11"},{"id":"fal-ai/recraft/v4.1/pro/text-to-image","name":"Recraft V4.1 Text to Image Pro","created_by":"fal","source":"official","description":"Recraft V4.1 Pro pushes the V4.1 model into high-resolution territory — up to 2048×2048 and ultra-wide formats.","status":"active","release_date":"2026-05-14","model_type":"image","page_url":"https://fal.run/fal-ai/recraft/v4.1/pro/text-to-image","tagline":"Recraft V4.1 Pro pushes the V4.1 model into high-resolution territory — up to 2048×2048 and ultra-wide formats.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-05-14","last_updated":"2026-06-03"},{"id":"fal-ai/recraft/v4.1/pro/text-to-vector","name":"Recraft V4.1 Text to Vector Pro","created_by":"fal","source":"official","description":"Recraft V4.1 Pro Vector generates large-format, fully editable SVGs with the structural clarity professional illustrators expect.","status":"active","release_date":"2026-05-14","model_type":"image","page_url":"https://fal.run/fal-ai/recraft/v4.1/pro/text-to-vector","tagline":"Recraft V4.1 Pro Vector generates large-format, fully editable SVGs with the structural clarity professional illustrators 
expect.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-05-14","last_updated":"2026-06-03"},{"id":"fal-ai/recraft/v4.1/text-to-image","name":"Recraft V4.1 Text to Image","created_by":"fal","source":"official","description":" Recraft V4.1 builds on the design-first foundation of V4 with sharper prompt control and cleaner composition.","status":"active","release_date":"2026-05-14","model_type":"image","page_url":"https://fal.run/fal-ai/recraft/v4.1/text-to-image","tagline":" Recraft V4.1 builds on the design-first foundation of V4 with sharper prompt control and cleaner composition.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/recraft/v4.1/text-to-vector","name":"Recraft V4.1 Text to Vector","created_by":"fal","source":"official","description":"Recraft V4.1 Vector turns prompts into fully editable SVGs with structured layers and clean geometry.","status":"active","release_date":"2026-05-14","model_type":"image","page_url":"https://fal.run/fal-ai/recraft/v4.1/text-to-vector","tagline":"Recraft V4.1 Vector turns prompts into fully editable SVGs with structured layers and clean geometry.","capabilities":{"vision":true,"structured_output":true,"json_mode":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-05-14","last_updated":"2026-06-03"},{"id":"fal-ai/recraft/v4.1/utility/pro/text-to-image","name":"Recraft V4.1 Utility Text to Image","created_by":"fal","source":"official","description":"Recraft V4.1 Utility Pro pairs the high-resolution output of V4.1 Pro with a faster, cost-efficient runtime.","status":"active","release_date":"2026-05-14","model_type":"image","page_url":"https://fal.run/fal-ai/recraft/v4.1/utility/pro/text-to-image","tagline":"Recraft V4.1 Utility Pro pairs the high-resolution output of V4.1 
Pro with a faster, cost-efficient runtime.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-05-14","last_updated":"2026-06-03"},{"id":"fal-ai/recraft/v4.1/utility/text-to-image","name":"Recraft V4.1 Text to Image Utility","created_by":"fal","source":"official","description":"Recraft V4.1 Utility is a faster, lighter variant of V4.1 made for high-volume creative workflows.","status":"active","release_date":"2026-05-14","model_type":"image","page_url":"https://fal.run/fal-ai/recraft/v4.1/utility/text-to-image","tagline":"Recraft V4.1 Utility is a faster, lighter variant of V4.1 made for high-volume creative workflows.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-05-14","last_updated":"2026-06-03"},{"id":"fal-ai/recraft/vectorize","name":"Recraft","created_by":"fal","source":"official","description":"Converts a given raster image to SVG format using Recraft model.","status":"active","release_date":"2025-06-12","model_type":"image","page_url":"https://fal.run/fal-ai/recraft/vectorize","tagline":"Converts a given raster image to SVG format using Recraft model.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/retoucher","name":"Face Retoucher","created_by":"fal","source":"official","description":"Automatically retouches faces to smooth skin and remove blemishes.","status":"active","release_date":"2024-02-13","model_type":"image","page_url":"https://fal.run/fal-ai/retoucher","tagline":"Automatically retouches faces to smooth skin and remove 
blemishes.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/rife/video","name":"RIFE","created_by":"fal","source":"official","description":"Interpolate videos with RIFE - Real-Time Intermediate Flow Estimation","status":"active","release_date":"2025-07-22","model_type":"other","page_url":"https://fal.run/fal-ai/rife/video","tagline":"Interpolate videos with RIFE - Real-Time Intermediate Flow Estimation","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/rife","name":"RIFE","created_by":"fal","source":"official","description":"Interpolate images with RIFE - Real-Time Intermediate Flow Estimation","status":"active","release_date":"2025-07-22","model_type":"image","page_url":"https://fal.run/fal-ai/rife","tagline":"Interpolate images with RIFE - Real-Time Intermediate Flow Estimation","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/sa2va/4b/image","name":"Sa2VA 4B Image","created_by":"fal","source":"official","description":"Sa2VA is an MLLM capable of question answering, visual prompt understanding, and dense object segmentation at both image and video levels","status":"active","release_date":"2025-01-13","model_type":"other","page_url":"https://fal.run/fal-ai/sa2va/4b/image","tagline":"Sa2VA is an MLLM capable of question answering, visual prompt understanding, and dense object segmentation at both image and video levels","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/sa2va/4b/video","name":"Sa2VA 4B Video","created_by":"fal","source":"official","description":"Sa2VA is an MLLM capable of question answering, visual prompt understanding, and dense object segmentation at both image and video 
levels","status":"active","release_date":"2025-01-13","model_type":"other","page_url":"https://fal.run/fal-ai/sa2va/4b/video","tagline":"Sa2VA is an MLLM capable of question answering, visual prompt understanding, and dense object segmentation at both image and video levels","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/sa2va/8b/image","name":"Sa2VA 8B Image","created_by":"fal","source":"official","description":"Sa2VA is an MLLM capable of question answering, visual prompt understanding, and dense object segmentation at both image and video levels","status":"active","release_date":"2025-01-13","model_type":"other","page_url":"https://fal.run/fal-ai/sa2va/8b/image","tagline":"Sa2VA is an MLLM capable of question answering, visual prompt understanding, and dense object segmentation at both image and video levels","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/sa2va/8b/video","name":"Sa2VA 8B Video","created_by":"fal","source":"official","description":"Sa2VA is an MLLM capable of question answering, visual prompt understanding, and dense object segmentation at both image and video levels","status":"active","release_date":"2025-01-13","model_type":"other","page_url":"https://fal.run/fal-ai/sa2va/8b/video","tagline":"Sa2VA is an MLLM capable of question answering, visual prompt understanding, and dense object segmentation at both image and video levels","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/sadtalker/reference","name":"Sad Talker","created_by":"fal","source":"official","description":"Learning Realistic 3D Motion Coefficients for Stylized Audio-Driven Single Image Talking Face Animation","status":"active","release_date":"2024-12-20","model_type":"video","page_url":"https://fal.run/fal-ai/sadtalker/reference","tagline":"Learning Realistic 3D Motion Coefficients for Stylized Audio-Driven Single Image 
Talking Face Animation","capabilities":{"vision":true},"modalities":{"input":["text","image","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/sadtalker","name":"Sad Talker","created_by":"fal","source":"official","description":"Learning Realistic 3D Motion Coefficients for Stylized Audio-Driven Single Image Talking Face Animation","status":"active","release_date":"2024-04-11","model_type":"video","page_url":"https://fal.run/fal-ai/sadtalker","tagline":"Learning Realistic 3D Motion Coefficients for Stylized Audio-Driven Single Image Talking Face Animation","capabilities":{"vision":true},"modalities":{"input":["text","image","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/sam-3-1/image-rle","name":"Sam 3 1","created_by":"fal","source":"official","description":"SAM 3.1 builds comes with Object Multiplex, a shared-memory approach for joint multi-object tracking that delivers faster speeds with larger number of objects tracked.","status":"active","release_date":"2026-03-30","model_type":"image","page_url":"https://fal.run/fal-ai/sam-3-1/image-rle","tagline":"SAM 3.1 builds comes with Object Multiplex, a shared-memory approach for joint multi-object tracking that delivers faster speeds with larger number of objects tracked.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-05-07","last_updated":"2026-05-11"},{"id":"fal-ai/sam-3-1/image","name":"Sam 3 1","created_by":"fal","source":"official","description":"SAM 3.1 builds comes with Object Multiplex, a shared-memory approach for joint multi-object tracking that delivers faster speeds with larger number of objects tracked.","status":"active","release_date":"2026-03-30","model_type":"image","page_url":"https://fal.run/fal-ai/sam-3-1/image","tagline":"SAM 3.1 builds comes with Object Multiplex, a 
shared-memory approach for joint multi-object tracking that delivers faster speeds with larger number of objects tracked.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-05-07","last_updated":"2026-05-11"},{"id":"fal-ai/sam-3-1/video-rle","name":"Sam 3 1","created_by":"fal","source":"official","description":"SAM 3.1 builds comes with Object Multiplex, a shared-memory approach for joint multi-object tracking that delivers faster speeds with larger number of objects tracked.","status":"active","release_date":"2026-03-30","model_type":"other","page_url":"https://fal.run/fal-ai/sam-3-1/video-rle","tagline":"SAM 3.1 builds comes with Object Multiplex, a shared-memory approach for joint multi-object tracking that delivers faster speeds with larger number of objects tracked.","last_seen_at":"2026-05-07","last_updated":"2026-05-11"},{"id":"fal-ai/sam-3-1/video","name":"Sam 3 1","created_by":"fal","source":"official","description":"SAM 3.1 builds comes with Object Multiplex, a shared-memory approach for joint multi-object tracking that delivers faster speeds with larger number of objects tracked.","status":"active","release_date":"2026-03-30","model_type":"other","page_url":"https://fal.run/fal-ai/sam-3-1/video","tagline":"SAM 3.1 builds comes with Object Multiplex, a shared-memory approach for joint multi-object tracking that delivers faster speeds with larger number of objects tracked.","last_seen_at":"2026-05-07","last_updated":"2026-05-11"},{"id":"fal-ai/sam-3/3d-align","name":"Sam 3","created_by":"fal","source":"official","description":"SAM 3D enables full scene reconstructions, placing objects and humans in a shared context together.","status":"active","release_date":"2025-12-02","model_type":"other","page_url":"https://fal.run/fal-ai/sam-3/3d-align","tagline":"SAM 3D enables full scene reconstructions, placing objects and humans in a shared context 
together.","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/sam-3/3d-body","name":"Sam 3","created_by":"fal","source":"official","description":"SAM 3D allows for accurate 3D reconstruction of human body shape and position from a single image.","status":"active","release_date":"2025-12-02","model_type":"other","page_url":"https://fal.run/fal-ai/sam-3/3d-body","tagline":"SAM 3D allows for accurate 3D reconstruction of human body shape and position from a single image.","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/sam-3/3d-objects","name":"Sam 3","created_by":"fal","source":"official","description":"SAM 3D enables precise 3D reconstruction of objects from real images, while accurately reconstructing their geometry and texture.","status":"active","release_date":"2025-12-02","model_type":"other","page_url":"https://fal.run/fal-ai/sam-3/3d-objects","tagline":"SAM 3D enables precise 3D reconstruction of objects from real images, while accurately reconstructing their geometry and texture.","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/sam-3/image/embed","name":"Sam 3","created_by":"fal","source":"official","description":"SAM 3 is a unified foundation model for promptable segmentation in images and videos.","status":"active","release_date":"2025-11-20","model_type":"other","page_url":"https://fal.run/fal-ai/sam-3/image/embed","tagline":"SAM 3 is a unified foundation model for promptable segmentation in images and videos.","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/sam-3/image-rle","name":"Sam 3","created_by":"fal","source":"official","description":"SAM 3 is a unified foundation model for promptable segmentation in images and videos.","status":"active","release_date":"2025-11-20","model_type":"image","page_url":"https://fal.run/fal-ai/sam-3/image-rle","tagline":"SAM 3 is a unified 
foundation model for promptable segmentation in images and videos.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/sam-3/image","name":"Segment Anything Model 3","created_by":"fal","source":"official","description":"SAM 3 is a unified foundation model for promptable segmentation in images and videos.","status":"active","release_date":"2025-11-20","model_type":"image","page_url":"https://fal.run/fal-ai/sam-3/image","tagline":"SAM 3 is a unified foundation model for promptable segmentation in images and videos.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/sam-3/video-rle","name":"Sam 3","created_by":"fal","source":"official","description":"SAM 3 is a unified foundation model for promptable segmentation in images and videos.","status":"active","release_date":"2025-11-20","model_type":"other","page_url":"https://fal.run/fal-ai/sam-3/video-rle","tagline":"SAM 3 is a unified foundation model for promptable segmentation in images and videos.","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/sam-3/video","name":"Sam 3","created_by":"fal","source":"official","description":"SAM 3 is a unified foundation model for promptable segmentation in images and videos.","status":"active","release_date":"2025-11-20","model_type":"other","page_url":"https://fal.run/fal-ai/sam-3/video","tagline":"SAM 3 is a unified foundation model for promptable segmentation in images and videos.","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/sam-audio/separate","name":"Sam Audio","created_by":"fal","source":"official","description":"Audio separation with SAM 
Audio.","status":"active","release_date":"2025-12-30","model_type":"other","page_url":"https://fal.run/fal-ai/sam-audio/separate","tagline":"Audio separation with SAM Audio.","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/sam-audio/span-separate","name":"Sam Audio","created_by":"fal","source":"official","description":"Audio separation with SAM Audio.","status":"active","release_date":"2025-12-30","model_type":"other","page_url":"https://fal.run/fal-ai/sam-audio/span-separate","tagline":"Audio separation with SAM Audio.","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/sam-audio/visual-separate","name":"Sam Audio","created_by":"fal","source":"official","description":"Audio separation with SAM Audio.","status":"active","release_date":"2025-12-30","model_type":"other","page_url":"https://fal.run/fal-ai/sam-audio/visual-separate","tagline":"Audio separation with SAM Audio.","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/sam2/auto-segment","name":"Segment Anything Model 2","created_by":"fal","source":"official","description":"SAM 2 is a model for segmenting images automatically.","status":"active","release_date":"2025-02-25","model_type":"image","page_url":"https://fal.run/fal-ai/sam2/auto-segment","tagline":"SAM 2 is a model for segmenting images automatically.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/sam2/image","name":"Segment Anything Model 2","created_by":"fal","source":"official","description":"SAM 2 is a model for segmenting images and videos in real-time.","status":"active","release_date":"2024-08-15","model_type":"image","page_url":"https://fal.run/fal-ai/sam2/image","tagline":"SAM 2 is a model for segmenting images and videos in 
real-time.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/sam2/video","name":"Segment Anything Model 2","created_by":"fal","source":"official","description":"SAM 2 is a model for segmenting images and videos in real-time.","status":"active","release_date":"2024-08-15","model_type":"other","page_url":"https://fal.run/fal-ai/sam2/video","tagline":"SAM 2 is a model for segmenting images and videos in real-time.","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/sana/sprint","name":"Sana Sprint","created_by":"fal","source":"official","description":"Sana Sprint is a text-to-image model capable of generating 4K images with exceptional speed.","status":"active","release_date":"2025-03-31","model_type":"image","page_url":"https://fal.run/fal-ai/sana/sprint","tagline":"Sana Sprint is a text-to-image model capable of generating 4K images with exceptional speed.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/sana/v1.5/1.6b","name":"Sana v1.5 1.6B","created_by":"fal","source":"official","description":"Sana v1.5 1.6B is a lightweight text-to-image model that delivers 4K image generation with impressive efficiency.","status":"active","release_date":"2025-03-31","model_type":"image","page_url":"https://fal.run/fal-ai/sana/v1.5/1.6b","tagline":"Sana v1.5 1.6B is a lightweight text-to-image model that delivers 4K image generation with impressive efficiency.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/sana/v1.5/4.8b","name":"Sana v1.5 4.8B","created_by":"fal","source":"official","description":"Sana v1.5 4.8B is a powerful text-to-image 
model that generates ultra-high quality 4K images with remarkable detail.","status":"active","release_date":"2025-03-31","model_type":"image","page_url":"https://fal.run/fal-ai/sana/v1.5/4.8b","tagline":"Sana v1.5 4.8B is a powerful text-to-image model that generates ultra-high quality 4K images with remarkable detail.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/sana-video","name":"Sana Video","created_by":"fal","source":"official","description":"Leverage Sana's ultra-fast processing speed to generate high-quality assets that transform your text prompts into production-ready videos","status":"active","release_date":"2025-11-07","model_type":"video","page_url":"https://fal.run/fal-ai/sana-video","tagline":"Leverage Sana's ultra-fast processing speed to generate high-quality assets that transform your text prompts into production-ready videos","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/sana","name":"Sana","created_by":"fal","source":"official","description":"Sana can synthesize high-resolution, high-quality images with strong text-image alignment at a remarkably fast speed, with the ability to generate 4K images in less than a second.","status":"active","release_date":"2024-08-01","model_type":"image","page_url":"https://fal.run/fal-ai/sana","tagline":"Sana can synthesize high-resolution, high-quality images with strong text-image alignment at a remarkably fast speed, with the ability to generate 4K images in less than a second.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/scail-2","name":"Scail 2","created_by":"fal","source":"official","description":"SCAIL-2 is an end-to-end character animation model that 
drives a reference character from a source video without relying on intermediate pose representations like skeleton maps.","status":"active","release_date":"2026-06-18","model_type":"other","page_url":"https://fal.run/fal-ai/scail-2","tagline":"SCAIL-2 is an end-to-end character animation model that drives a reference character from a source video without relying on intermediate pose representations like skeleton maps.","last_seen_at":"2026-06-18","last_updated":"2026-06-20"},{"id":"fal-ai/scail","name":"Scail","created_by":"fal","source":"official","description":"SCAIL is a character animation model that uses 3D consistent pose representations to animate reference images with coherent motion, supporting complex movements.","status":"active","release_date":"2025-12-17","model_type":"other","page_url":"https://fal.run/fal-ai/scail","tagline":"SCAIL is a character animation model that uses 3D consistent pose representations to animate reference images with coherent motion, supporting complex movements.","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/scene-finder","name":"Scene Finder","created_by":"fal","source":"official","description":"Search any video with a text prompt - Scene Finder locates the matching moments and returns their time segments and extracted frames.","status":"active","release_date":"2026-06-03","model_type":"other","page_url":"https://fal.run/fal-ai/scene-finder","tagline":"Search any video with a text prompt - Scene Finder locates the matching moments and returns their time segments and extracted frames.","capabilities":{"vision":true},"last_seen_at":"2026-06-03","last_updated":"2026-06-10"},{"id":"fal-ai/sd15-depth-controlnet","name":"SD 1.5 Depth ControlNet","created_by":"fal","source":"official","description":"SD 1.5 ControlNet","status":"active","release_date":"2024-05-31","model_type":"image","page_url":"https://fal.run/fal-ai/sd15-depth-controlnet","tagline":"SD 1.5 
ControlNet","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/sdxl-controlnet-union/image-to-image","name":"SDXL ControlNet Union","created_by":"fal","source":"official","description":"An efficent SDXL multi-controlnet image-to-image model.","status":"active","release_date":"2024-07-31","model_type":"image","page_url":"https://fal.run/fal-ai/sdxl-controlnet-union/image-to-image","tagline":"An efficent SDXL multi-controlnet image-to-image model.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/sdxl-controlnet-union/inpainting","name":"SDXL ControlNet Union","created_by":"fal","source":"official","description":"An efficent SDXL multi-controlnet inpainting model.","status":"active","release_date":"2024-07-31","model_type":"image","page_url":"https://fal.run/fal-ai/sdxl-controlnet-union/inpainting","tagline":"An efficent SDXL multi-controlnet inpainting model.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/sdxl-controlnet-union","name":"SDXL ControlNet Union","created_by":"fal","source":"official","description":"An efficent SDXL multi-controlnet text-to-image model.","status":"active","release_date":"2024-07-31","model_type":"image","page_url":"https://fal.run/fal-ai/sdxl-controlnet-union","tagline":"An efficent SDXL multi-controlnet text-to-image model.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/seedvr/upscale/image/seamless","name":"SeedVR2","created_by":"fal","source":"official","description":"Use SeedVR2 to upscale images, retaining 
seamless tiling","status":"active","release_date":"2026-03-23","model_type":"image","page_url":"https://fal.run/fal-ai/seedvr/upscale/image/seamless","tagline":"Use SeedVR2 to upscale images, retaining seamless tiling","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-05-26","last_updated":"2026-06-03"},{"id":"fal-ai/seedvr/upscale/image","name":"SeedVR2","created_by":"fal","source":"official","description":"Use SeedVR2 to upscale your images","status":"active","release_date":"2025-09-22","model_type":"image","page_url":"https://fal.run/fal-ai/seedvr/upscale/image","tagline":"Use SeedVR2 to upscale your images","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-05-26","last_updated":"2026-06-03"},{"id":"fal-ai/seedvr/upscale/video","name":"SeedVR2","created_by":"fal","source":"official","description":"Upscale your videos using SeedVR2 with temporal consistency!","status":"active","release_date":"2025-09-22","model_type":"other","page_url":"https://fal.run/fal-ai/seedvr/upscale/video","tagline":"Upscale your videos using SeedVR2 with temporal consistency!","last_seen_at":"2026-05-26","last_updated":"2026-06-03"},{"id":"fal-ai/sensenova-u1-infographic","name":"Sensenova U1 Infographic","created_by":"fal","source":"official","description":"Generate Infographic Image with Sensenova U1","status":"active","release_date":"2026-06-17","model_type":"image","page_url":"https://fal.run/fal-ai/sensenova-u1-infographic","tagline":"Generate Infographic Image with Sensenova U1","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-17","last_updated":"2026-06-18"},{"id":"fal-ai/silero-vad","name":"Silero VAD","created_by":"fal","source":"official","description":"Detect speech presence and timestamps with accuracy and speed using the 
ultra-lightweight Silero VAD model","status":"active","release_date":"2026-01-08","model_type":"transcription","page_url":"https://fal.run/fal-ai/silero-vad","tagline":"Detect speech presence and timestamps with accuracy and speed using the ultra-lightweight Silero VAD model","modalities":{"input":["audio"],"output":["text"]},"endpoints":["audio_transcriptions"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/skyreels-i2v","name":"Skyreels V1 (Image-to-Video)","created_by":"fal","source":"official","description":"SkyReels V1 is the first and most advanced open-source human-centric video foundation model.","status":"active","release_date":"2025-02-18","model_type":"video","page_url":"https://fal.run/fal-ai/skyreels-i2v","tagline":"SkyReels V1 is the first and most advanced open-source human-centric video foundation model.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/smart-resize","name":"Smart Resize","created_by":"fal","source":"official","description":" Smart image resize to arbitrary dimensions, powered by Nano Banana Pro with vision-LLM-guided prompting for composition-aware recomposition.","status":"active","release_date":"2026-04-28","model_type":"image","page_url":"https://fal.run/fal-ai/smart-resize","tagline":" Smart image resize to arbitrary dimensions, powered by Nano Banana Pro with vision-LLM-guided prompting for composition-aware recomposition.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-05-07","last_updated":"2026-05-11"},{"id":"fal-ai/smart-turn","name":"Pipecat's Smart Turn model","created_by":"fal","source":"official","description":"An open source, community-driven and native audio turn detection model by Pipecat 
AI.","status":"active","release_date":"2025-04-21","model_type":"transcription","page_url":"https://fal.run/fal-ai/smart-turn","tagline":"An open source, community-driven and native audio turn detection model by Pipecat AI.","modalities":{"input":["audio"],"output":["text"]},"endpoints":["audio_transcriptions"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/sora-2/characters","name":"Sora 2","created_by":"fal","source":"official","family":"sora-2","description":"Generate character ids to use with Sora 2 generations","status":"active","release_date":"2026-03-12","model_type":"video","page_url":"https://fal.run/fal-ai/sora-2/characters","tagline":"Generate character ids to use with Sora 2 generations","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-03-13","last_updated":"2026-05-11"},{"id":"fal-ai/sora-2/image-to-video/pro","name":"Sora 2","created_by":"fal","source":"official","family":"sora-2","description":"Image-to-video endpoint for Sora 2 Pro, OpenAI's state-of-the-art video model capable of creating richly detailed, dynamic clips with audio from natural language or images.","status":"active","release_date":"2025-10-06","model_type":"video","page_url":"https://fal.run/fal-ai/sora-2/image-to-video/pro","tagline":"Image-to-video endpoint for Sora 2 Pro, OpenAI's state-of-the-art video model capable of creating richly detailed, dynamic clips with audio from natural language or images.","capabilities":{"vision":true},"modalities":{"input":["text","image","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/sora-2/image-to-video","name":"Sora 2","created_by":"fal","source":"official","family":"sora-2","description":"Image-to-video endpoint for Sora 2, OpenAI's state-of-the-art video model capable of creating richly detailed, dynamic clips with audio from natural language or 
images.","status":"active","release_date":"2025-10-06","model_type":"video","page_url":"https://fal.run/fal-ai/sora-2/image-to-video","tagline":"Image-to-video endpoint for Sora 2, OpenAI's state-of-the-art video model capable of creating richly detailed, dynamic clips with audio from natural language or images.","capabilities":{"vision":true},"modalities":{"input":["text","image","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/sora-2/text-to-video/pro","name":"Sora 2","created_by":"fal","source":"official","family":"sora-2","description":"Text-to-video endpoint for Sora 2 Pro, OpenAI's state-of-the-art video model capable of creating richly detailed, dynamic clips with audio from natural language or images.","status":"active","release_date":"2025-10-06","model_type":"video","page_url":"https://fal.run/fal-ai/sora-2/text-to-video/pro","tagline":"Text-to-video endpoint for Sora 2 Pro, OpenAI's state-of-the-art video model capable of creating richly detailed, dynamic clips with audio from natural language or images.","capabilities":{"vision":true},"modalities":{"input":["text","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/sora-2/text-to-video","name":"Sora 2","created_by":"fal","source":"official","family":"sora-2","description":"Text-to-video endpoint for Sora 2, OpenAI's state-of-the-art video model capable of creating richly detailed, dynamic clips with audio from natural language or images.","status":"active","release_date":"2025-10-06","model_type":"video","page_url":"https://fal.run/fal-ai/sora-2/text-to-video","tagline":"Text-to-video endpoint for Sora 2, OpenAI's state-of-the-art video model capable of creating richly detailed, dynamic clips with audio from natural language or 
images.","capabilities":{"vision":true},"modalities":{"input":["text","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/sora-2/video-to-video/remix","name":"Sora 2","created_by":"fal","source":"official","family":"sora-2","description":"Video-to-video remix endpoint for Sora 2, OpenAI’s advanced model that transforms existing videos based on new text or image prompts allowing rich edits, style changes, and creative reinterpretations ","status":"active","release_date":"2025-10-08","model_type":"other","page_url":"https://fal.run/fal-ai/sora-2/video-to-video/remix","tagline":"Video-to-video remix endpoint for Sora 2, OpenAI’s advanced model that transforms existing videos based on new text or image prompts allowing rich edits, style changes, and creative reinterpretations ","capabilities":{"vision":true},"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/speech-to-text/stream","name":"Speech-To-text","created_by":"fal","source":"official","description":"Leverage the rapid processing capabilities of AI models to enable accurate and efficient real-time speech-to-text transcription.","status":"active","release_date":"2025-04-04","model_type":"transcription","page_url":"https://fal.run/fal-ai/speech-to-text/stream","tagline":"Leverage the rapid processing capabilities of AI models to enable accurate and efficient real-time speech-to-text transcription.","modalities":{"input":["audio"],"output":["text"]},"endpoints":["audio_transcriptions"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/speech-to-text/turbo/stream","name":"Speech-to-Text","created_by":"fal","source":"official","description":"Leverage the rapid processing capabilities of AI models to enable accurate and efficient real-time speech-to-text 
transcription.","status":"active","release_date":"2025-04-04","model_type":"transcription","page_url":"https://fal.run/fal-ai/speech-to-text/turbo/stream","tagline":"Leverage the rapid processing capabilities of AI models to enable accurate and efficient real-time speech-to-text transcription.","modalities":{"input":["audio"],"output":["text"]},"endpoints":["audio_transcriptions"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/speech-to-text/turbo","name":"Speech-to-Text","created_by":"fal","source":"official","description":"Leverage the rapid processing capabilities of AI models to enable accurate and efficient real-time speech-to-text transcription.","status":"active","release_date":"2025-04-04","model_type":"transcription","page_url":"https://fal.run/fal-ai/speech-to-text/turbo","tagline":"Leverage the rapid processing capabilities of AI models to enable accurate and efficient real-time speech-to-text transcription.","modalities":{"input":["audio"],"output":["text"]},"endpoints":["audio_transcriptions"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/speech-to-text","name":"Speech-to-Text","created_by":"fal","source":"official","description":"Leverage the rapid processing capabilities of AI models to enable accurate and efficient real-time speech-to-text transcription.","status":"active","release_date":"2025-04-04","model_type":"transcription","page_url":"https://fal.run/fal-ai/speech-to-text","tagline":"Leverage the rapid processing capabilities of AI models to enable accurate and efficient real-time speech-to-text transcription.","capabilities":{"streaming":true},"modalities":{"input":["audio"],"output":["text"]},"endpoints":["audio_transcriptions"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/stable-audio-25/audio-to-audio","name":"Stable Audio 2.5","created_by":"fal","source":"official","description":"Generate high quality music and sound effects using Stable Audio 2.5 from 
StabilityAI","status":"active","release_date":"2025-09-10","model_type":"other","page_url":"https://fal.run/fal-ai/stable-audio-25/audio-to-audio","tagline":"Generate high quality music and sound effects using Stable Audio 2.5 from StabilityAI","last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/stable-audio-25/inpaint","name":"Stable Audio 25","created_by":"fal","source":"official","description":"Generate high quality music and sound effects using Stable Audio 2.5 from StabilityAI","status":"active","release_date":"2025-09-10","model_type":"other","page_url":"https://fal.run/fal-ai/stable-audio-25/inpaint","tagline":"Generate high quality music and sound effects using Stable Audio 2.5 from StabilityAI","last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/stable-audio-25/text-to-audio","name":"Stable Audio 2.5","created_by":"fal","source":"official","description":"Generate high quality music and sound effects using Stable Audio 2.5 from StabilityAI","status":"active","release_date":"2025-09-10","model_type":"other","page_url":"https://fal.run/fal-ai/stable-audio-25/text-to-audio","tagline":"Generate high quality music and sound effects using Stable Audio 2.5 from StabilityAI","last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/stable-audio-3/medium/audio-inpainting","name":"Stable Audio 3 Medium Audio Inpainting","created_by":"fal","source":"official","description":"Stable Audio 3 Medium audio inpainting is a 1.4 billion parameter latent diffusion model that fills in or reworks selected segments of a stereo track guided by text prompts, supporting single- and mul","status":"active","release_date":"2026-05-22","model_type":"other","page_url":"https://fal.run/fal-ai/stable-audio-3/medium/audio-inpainting","tagline":"Stable Audio 3 Medium audio inpainting is a 1.4 billion parameter latent diffusion model that fills in or reworks selected segments of a stereo track guided by text prompts, supporting single- and 
mul","last_seen_at":"2026-06-03","last_updated":"2026-06-10"},{"id":"fal-ai/stable-audio-3/medium/audio-outpainting","name":"Stable Audio 3 Medium Audio Outpainting","created_by":"fal","source":"official","description":"Stable Audio 3 Medium audio outpainting is a 1.4 billion parameter latent diffusion model that extends existing stereo audio beyond its original endpoint via causal continuation guided by text prompts","status":"active","release_date":"2026-05-22","model_type":"other","page_url":"https://fal.run/fal-ai/stable-audio-3/medium/audio-outpainting","tagline":"Stable Audio 3 Medium audio outpainting is a 1.4 billion parameter latent diffusion model that extends existing stereo audio beyond its original endpoint via causal continuation guided by text prompts","last_seen_at":"2026-06-03","last_updated":"2026-06-10"},{"id":"fal-ai/stable-audio-3/medium/audio-to-audio","name":"Stable Audio 3 Medium Audio to Audio","created_by":"fal","source":"official","description":"Stable Audio 3 Medium audio-to-audio is a 1.4 billion parameter latent diffusion model that transforms an input audio clip into new stereo variations up to 6 minutes guided by a text prompt.","status":"active","release_date":"2026-05-22","model_type":"other","page_url":"https://fal.run/fal-ai/stable-audio-3/medium/audio-to-audio","tagline":"Stable Audio 3 Medium audio-to-audio is a 1.4 billion parameter latent diffusion model that transforms an input audio clip into new stereo variations up to 6 minutes guided by a text prompt.","last_seen_at":"2026-06-03","last_updated":"2026-06-10"},{"id":"fal-ai/stable-audio-3/medium/base/audio-inpainting","name":"Stable Audio 3 Medium Base Audio Inpainting","created_by":"fal","source":"official","description":"Stable Audio 3 Medium Base audio inpainting is the foundational 1.4 billion parameter checkpoint for editing or filling selected stereo audio segments guided by text 
prompts.","status":"active","release_date":"2026-05-22","model_type":"other","page_url":"https://fal.run/fal-ai/stable-audio-3/medium/base/audio-inpainting","tagline":"Stable Audio 3 Medium Base audio inpainting is the foundational 1.4 billion parameter checkpoint for editing or filling selected stereo audio segments guided by text prompts.","last_seen_at":"2026-06-03","last_updated":"2026-06-10"},{"id":"fal-ai/stable-audio-3/medium/base/audio-outpainting","name":"Stable Audio 3 Medium Base Audio Outpainting","created_by":"fal","source":"official","description":"Stable Audio 3 Medium Base audio outpainting is the foundational 1.4 billion parameter checkpoint that extends existing stereo audio with causal continuation guided by text prompts.","status":"active","release_date":"2026-05-22","model_type":"other","page_url":"https://fal.run/fal-ai/stable-audio-3/medium/base/audio-outpainting","tagline":"Stable Audio 3 Medium Base audio outpainting is the foundational 1.4 billion parameter checkpoint that extends existing stereo audio with causal continuation guided by text prompts.","last_seen_at":"2026-06-03","last_updated":"2026-06-10"},{"id":"fal-ai/stable-audio-3/medium/base/audio-to-audio","name":"Stable Audio 3 Medium Base Audio to Audio","created_by":"fal","source":"official","description":"Stable Audio 3 Medium Base audio-to-audio is the foundational 1.4 billion parameter checkpoint that transforms input audio into new stereo variations up to 6 minutes guided by text prompts.","status":"active","release_date":"2026-05-22","model_type":"other","page_url":"https://fal.run/fal-ai/stable-audio-3/medium/base/audio-to-audio","tagline":"Stable Audio 3 Medium Base audio-to-audio is the foundational 1.4 billion parameter checkpoint that transforms input audio into new stereo variations up to 6 minutes guided by text prompts.","last_seen_at":"2026-06-03","last_updated":"2026-06-10"},{"id":"fal-ai/stable-audio-3/medium/base/text-to-audio","name":"Stable Audio 3 Medium Base 
Text to Audio","created_by":"fal","source":"official","description":"Stable Audio 3 Medium Base is the foundational 1.4 billion parameter text-to-audio checkpoint generating stereo music up to 6 minutes, intended as the unmodified base for custom fine-tuning workflows.","status":"active","release_date":"2026-05-22","model_type":"other","page_url":"https://fal.run/fal-ai/stable-audio-3/medium/base/text-to-audio","tagline":"Stable Audio 3 Medium Base is the foundational 1.4 billion parameter text-to-audio checkpoint generating stereo music up to 6 minutes, intended as the unmodified base for custom fine-tuning workflows.","last_seen_at":"2026-06-03","last_updated":"2026-06-10"},{"id":"fal-ai/stable-audio-3/medium/text-to-audio","name":"Stable Audio 3","created_by":"fal","source":"official","description":"Stable Audio 3 Medium is a 1.4 billion parameter latent diffusion model that generates high-quality stereo music up to 6 minutes from text prompts, trained on fully licensed data for safe commercial u","status":"active","release_date":"2026-05-22","model_type":"other","page_url":"https://fal.run/fal-ai/stable-audio-3/medium/text-to-audio","tagline":"Stable Audio 3 Medium is a 1.4 billion parameter latent diffusion model that generates high-quality stereo music up to 6 minutes from text prompts, trained on fully licensed data for safe commercial u","last_seen_at":"2026-06-03","last_updated":"2026-06-10"},{"id":"fal-ai/stable-audio-3/small/music/audio-inpainting","name":"Stable Audio 3 Small Music Audio Inpainting","created_by":"fal","source":"official","description":"Stable Audio 3 Small Music audio inpainting is a 459 million parameter latent diffusion model that fills in or reworks selected segments of a music track guided by text prompts.","status":"active","release_date":"2026-05-25","model_type":"other","page_url":"https://fal.run/fal-ai/stable-audio-3/small/music/audio-inpainting","tagline":"Stable Audio 3 Small Music audio inpainting is a 459 million parameter 
latent diffusion model that fills in or reworks selected segments of a music track guided by text prompts.","last_seen_at":"2026-06-03","last_updated":"2026-06-10"},{"id":"fal-ai/stable-audio-3/small/music/audio-outpainting","name":"Stable Audio 3 Small Music Audio Outpainting","created_by":"fal","source":"official","description":"Stable Audio 3 Small Music audio outpainting is a 459 million parameter latent diffusion model that extends music compositions beyond their original endpoint via causal continuation.","status":"active","release_date":"2026-05-25","model_type":"other","page_url":"https://fal.run/fal-ai/stable-audio-3/small/music/audio-outpainting","tagline":"Stable Audio 3 Small Music audio outpainting is a 459 million parameter latent diffusion model that extends music compositions beyond their original endpoint via causal continuation.","last_seen_at":"2026-06-03","last_updated":"2026-06-10"},{"id":"fal-ai/stable-audio-3/small/music/audio-to-audio","name":"Stable Audio 3","created_by":"fal","source":"official","description":"Stable Audio 3 Small Music audio-to-audio is a 459 million parameter latent diffusion model that transforms input music into new variations up to 2 minutes guided by text prompts.","status":"active","release_date":"2026-05-22","model_type":"other","page_url":"https://fal.run/fal-ai/stable-audio-3/small/music/audio-to-audio","tagline":"Stable Audio 3 Small Music audio-to-audio is a 459 million parameter latent diffusion model that transforms input music into new variations up to 2 minutes guided by text prompts.","last_seen_at":"2026-06-03","last_updated":"2026-06-10"},{"id":"fal-ai/stable-audio-3/small/music/base/audio-inpainting","name":"Stable Audio 3 Small Music Base Audio Inpainting","created_by":"fal","source":"official","description":"Stable Audio 3 Small Music Base audio inpainting is the foundational 459 million parameter checkpoint for editing or filling selected music segments guided by text 
prompts.","status":"active","release_date":"2026-05-25","model_type":"other","page_url":"https://fal.run/fal-ai/stable-audio-3/small/music/base/audio-inpainting","tagline":"Stable Audio 3 Small Music Base audio inpainting is the foundational 459 million parameter checkpoint for editing or filling selected music segments guided by text prompts.","last_seen_at":"2026-06-03","last_updated":"2026-06-10"},{"id":"fal-ai/stable-audio-3/small/music/base/audio-outpainting","name":"Stable Audio 3 Small Music Base Audio Outpainting","created_by":"fal","source":"official","description":"Stable Audio 3 Small Music Base audio outpainting is the foundational 459 million parameter checkpoint that extends music tracks via causal continuation guided by text prompts.","status":"active","release_date":"2026-05-25","model_type":"other","page_url":"https://fal.run/fal-ai/stable-audio-3/small/music/base/audio-outpainting","tagline":"Stable Audio 3 Small Music Base audio outpainting is the foundational 459 million parameter checkpoint that extends music tracks via causal continuation guided by text prompts.","last_seen_at":"2026-06-03","last_updated":"2026-06-10"},{"id":"fal-ai/stable-audio-3/small/music/base/audio-to-audio","name":"Stable Audio 3 Small Music Base Audio to Audio","created_by":"fal","source":"official","description":"Stable Audio 3 Small Music Base audio-to-audio is the foundational 459 million parameter checkpoint that transforms input music into new variations up to 2 minutes guided by text prompts.","status":"active","release_date":"2026-05-25","model_type":"other","page_url":"https://fal.run/fal-ai/stable-audio-3/small/music/base/audio-to-audio","tagline":"Stable Audio 3 Small Music Base audio-to-audio is the foundational 459 million parameter checkpoint that transforms input music into new variations up to 2 minutes guided by text 
prompts.","last_seen_at":"2026-06-03","last_updated":"2026-06-10"},{"id":"fal-ai/stable-audio-3/small/music/base/text-to-audio","name":"Stable Audio 3","created_by":"fal","source":"official","description":"Stable Audio 3 Small Music Base is the foundational 459 million parameter checkpoint generating full music compositions up to 2 minutes from text prompts, intended as the unmodified base for fine-tuni","status":"active","release_date":"2026-05-22","model_type":"other","page_url":"https://fal.run/fal-ai/stable-audio-3/small/music/base/text-to-audio","tagline":"Stable Audio 3 Small Music Base is the foundational 459 million parameter checkpoint generating full music compositions up to 2 minutes from text prompts, intended as the unmodified base for fine-tuni","last_seen_at":"2026-06-03","last_updated":"2026-06-10"},{"id":"fal-ai/stable-audio-3/small/music/text-to-audio","name":"Stable Audio 3 Small Music Text to Audio","created_by":"fal","source":"official","description":"Stable Audio 3 Small Music is a 459 million parameter latent diffusion model that generates full stereo music compositions up to 2 minutes from text prompts, lightweight enough for on-device deploymen","status":"active","release_date":"2026-05-22","model_type":"other","page_url":"https://fal.run/fal-ai/stable-audio-3/small/music/text-to-audio","tagline":"Stable Audio 3 Small Music is a 459 million parameter latent diffusion model that generates full stereo music compositions up to 2 minutes from text prompts, lightweight enough for on-device deploymen","last_seen_at":"2026-06-03","last_updated":"2026-06-10"},{"id":"fal-ai/stable-audio-3/small/sfx/audio-inpainting","name":"Stable Audio 3 Small SFX Audio Inpainting","created_by":"fal","source":"official","description":"Stable Audio 3 Small SFX audio inpainting is a 459 million parameter latent diffusion model that fills in or reworks selected segments of a sound-effect track guided by text 
prompts.","status":"active","release_date":"2026-05-25","model_type":"other","page_url":"https://fal.run/fal-ai/stable-audio-3/small/sfx/audio-inpainting","tagline":"Stable Audio 3 Small SFX audio inpainting is a 459 million parameter latent diffusion model that fills in or reworks selected segments of a sound-effect track guided by text prompts.","last_seen_at":"2026-06-03","last_updated":"2026-06-10"},{"id":"fal-ai/stable-audio-3/small/sfx/audio-outpainting","name":"Stable Audio 3 Small SFX Audio Outpainting","created_by":"fal","source":"official","description":"Stable Audio 3 Small SFX audio outpainting is a 459 million parameter latent diffusion model that extends sound-effect tracks beyond their original endpoint via causal continuation.","status":"active","release_date":"2026-05-25","model_type":"other","page_url":"https://fal.run/fal-ai/stable-audio-3/small/sfx/audio-outpainting","tagline":"Stable Audio 3 Small SFX audio outpainting is a 459 million parameter latent diffusion model that extends sound-effect tracks beyond their original endpoint via causal continuation.","last_seen_at":"2026-06-03","last_updated":"2026-06-10"},{"id":"fal-ai/stable-audio-3/small/sfx/audio-to-audio","name":"Stable Audio 3","created_by":"fal","source":"official","description":"Stable Audio 3 Small SFX audio-to-audio is a 459 million parameter latent diffusion model that transforms input audio into new sound-effect variations guided by text prompts.","status":"active","release_date":"2026-05-25","model_type":"other","page_url":"https://fal.run/fal-ai/stable-audio-3/small/sfx/audio-to-audio","tagline":"Stable Audio 3 Small SFX audio-to-audio is a 459 million parameter latent diffusion model that transforms input audio into new sound-effect variations guided by text prompts.","last_seen_at":"2026-06-03","last_updated":"2026-06-10"},{"id":"fal-ai/stable-audio-3/small/sfx/base/audio-inpainting","name":"Stable Audio 3 Small SFX Base Audio 
Inpainting","created_by":"fal","source":"official","description":"Stable Audio 3 Small SFX Base audio inpainting is the foundational 459 million parameter checkpoint for editing or filling selected sound-effect segments guided by text prompts.","status":"active","release_date":"2026-05-25","model_type":"other","page_url":"https://fal.run/fal-ai/stable-audio-3/small/sfx/base/audio-inpainting","tagline":"Stable Audio 3 Small SFX Base audio inpainting is the foundational 459 million parameter checkpoint for editing or filling selected sound-effect segments guided by text prompts.","last_seen_at":"2026-06-03","last_updated":"2026-06-10"},{"id":"fal-ai/stable-audio-3/small/sfx/base/audio-outpainting","name":"Stable Audio 3 Small SFX Base Audio Outpainting","created_by":"fal","source":"official","description":"Stable Audio 3 Small SFX Base audio outpainting is the foundational 459 million parameter checkpoint that extends sound-effect tracks via causal continuation guided by text prompts.","status":"active","release_date":"2026-05-25","model_type":"other","page_url":"https://fal.run/fal-ai/stable-audio-3/small/sfx/base/audio-outpainting","tagline":"Stable Audio 3 Small SFX Base audio outpainting is the foundational 459 million parameter checkpoint that extends sound-effect tracks via causal continuation guided by text prompts.","last_seen_at":"2026-06-03","last_updated":"2026-06-10"},{"id":"fal-ai/stable-audio-3/small/sfx/base/audio-to-audio","name":"Stable Audio 3 Small SFX Base Audio to Audio","created_by":"fal","source":"official","description":"Stable Audio 3 Small SFX Base audio-to-audio is the foundational 459 million parameter checkpoint that transforms input audio into new sound-effect variations guided by text prompts.","status":"active","release_date":"2026-05-25","model_type":"other","page_url":"https://fal.run/fal-ai/stable-audio-3/small/sfx/base/audio-to-audio","tagline":"Stable Audio 3 Small SFX Base audio-to-audio is the foundational 459 million parameter 
checkpoint that transforms input audio into new sound-effect variations guided by text prompts.","last_seen_at":"2026-06-03","last_updated":"2026-06-10"},{"id":"fal-ai/stable-audio-3/small/sfx/base/text-to-audio","name":"Stable Audio 3 Small SFX Base Text to Audio","created_by":"fal","source":"official","description":"Stable Audio 3 Small SFX Base is the foundational 459 million parameter checkpoint generating sound effects from text prompts, intended as the unmodified base for fine-tuning.","status":"active","release_date":"2026-05-25","model_type":"other","page_url":"https://fal.run/fal-ai/stable-audio-3/small/sfx/base/text-to-audio","tagline":"Stable Audio 3 Small SFX Base is the foundational 459 million parameter checkpoint generating sound effects from text prompts, intended as the unmodified base for fine-tuning.","last_seen_at":"2026-06-03","last_updated":"2026-06-10"},{"id":"fal-ai/stable-audio-3/small/sfx/text-to-audio","name":"Stable Audio 3 Small SFX Text to Audio","created_by":"fal","source":"official","description":"Stable Audio 3 Small SFX is a 459 million parameter latent diffusion model that generates high-quality sound effects from text prompts, designed for on-device deployment on mobile phones and consumer ","status":"active","release_date":"2026-05-25","model_type":"other","page_url":"https://fal.run/fal-ai/stable-audio-3/small/sfx/text-to-audio","tagline":"Stable Audio 3 Small SFX is a 459 million parameter latent diffusion model that generates high-quality sound effects from text prompts, designed for on-device deployment on mobile phones and consumer ","last_seen_at":"2026-06-03","last_updated":"2026-06-10"},{"id":"fal-ai/stable-audio-3-trainer","name":"Stable Audio 3 Trainer","created_by":"fal","source":"official","description":"Stable Audio 3 LoRA Trainer fine-tunes Stable Audio 3 base models on paired audio-caption datasets, producing compact LoRA weights that adapt generation toward a custom music style, sound palette, or 
","status":"active","release_date":"2026-06-11","model_type":"other","page_url":"https://fal.run/fal-ai/stable-audio-3-trainer","tagline":"Stable Audio 3 LoRA Trainer fine-tunes Stable Audio 3 base models on paired audio-caption datasets, producing compact LoRA weights that adapt generation toward a custom music style, sound palette, or ","last_seen_at":"2026-06-14","last_updated":"2026-06-18"},{"id":"fal-ai/stable-audio","name":"Stable Audio Open","created_by":"fal","source":"official","description":"Open source text-to-audio model.","status":"active","release_date":"2024-01-04","model_type":"other","page_url":"https://fal.run/fal-ai/stable-audio","tagline":"Open source text-to-audio model.","last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/stable-avatar","name":"Stable Avatar","created_by":"fal","source":"official","description":"Stable Avatar generates audio-driven video avatars up to five minutes long","status":"active","release_date":"2025-08-14","model_type":"other","page_url":"https://fal.run/fal-ai/stable-avatar","tagline":"Stable Avatar generates audio-driven video avatars up to five minutes long","last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/stable-cascade/sote-diffusion","name":"SoteDiffusion","created_by":"fal","source":"official","description":"Anime finetune of Würstchen V3.","status":"active","release_date":"2024-06-10","model_type":"image","page_url":"https://fal.run/fal-ai/stable-cascade/sote-diffusion","tagline":"Anime finetune of Würstchen V3.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/stable-cascade","name":"Stable Cascade","created_by":"fal","source":"official","description":"Stable Cascade: Image generation on a smaller & cheaper latent 
space.","status":"active","release_date":"2024-06-25","model_type":"image","page_url":"https://fal.run/fal-ai/stable-cascade","tagline":"Stable Cascade: Image generation on a smaller & cheaper latent space.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/stable-diffusion-v15","name":"Stable Diffusion v1.5","created_by":"fal","source":"official","description":"Stable Diffusion v1.5","status":"active","release_date":"2024-04-16","model_type":"image","page_url":"https://fal.run/fal-ai/stable-diffusion-v15","tagline":"Stable Diffusion v1.5","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/stable-diffusion-v3-medium/image-to-image","name":"Stable Diffusion V3","created_by":"fal","source":"official","description":"Stable Diffusion 3 Medium (Image to Image) is a Multimodal Diffusion Transformer (MMDiT) model that improves image quality, typography, prompt understanding, and efficiency.","status":"active","release_date":"2024-06-12","model_type":"image","page_url":"https://fal.run/fal-ai/stable-diffusion-v3-medium/image-to-image","tagline":"Stable Diffusion 3 Medium (Image to Image) is a Multimodal Diffusion Transformer (MMDiT) model that improves image quality, typography, prompt understanding, and efficiency.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/stable-diffusion-v3-medium","name":"Stable Diffusion V3","created_by":"fal","source":"official","description":"Stable Diffusion 3 Medium (Text to Image) is a Multimodal Diffusion Transformer (MMDiT) model that improves image quality, typography, prompt understanding, and 
efficiency.","status":"active","release_date":"2024-08-20","model_type":"image","page_url":"https://fal.run/fal-ai/stable-diffusion-v3-medium","tagline":"Stable Diffusion 3 Medium (Text to Image) is a Multimodal Diffusion Transformer (MMDiT) model that improves image quality, typography, prompt understanding, and efficiency.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/stable-diffusion-v35-large","name":"Stable Diffusion 3.5 Large","created_by":"fal","source":"official","description":"Stable Diffusion 3.5 Large is a Multimodal Diffusion Transformer (MMDiT) text-to-image model that features improved performance in image quality, typography, complex prompt understanding, and resource","status":"active","release_date":"2024-10-27","model_type":"image","page_url":"https://fal.run/fal-ai/stable-diffusion-v35-large","tagline":"Stable Diffusion 3.5 Large is a Multimodal Diffusion Transformer (MMDiT) text-to-image model that features improved performance in image quality, typography, complex prompt understanding, and resource","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/stable-diffusion-v35-medium","name":"Stable Diffusion 3.5 Medium","created_by":"fal","source":"official","description":"Stable Diffusion 3.5 Medium is a Multimodal Diffusion Transformer (MMDiT) text-to-image model that features improved performance in image quality, typography, complex prompt understanding, and resourc","status":"active","release_date":"2024-10-27","model_type":"image","page_url":"https://fal.run/fal-ai/stable-diffusion-v35-medium","tagline":"Stable Diffusion 3.5 Medium is a Multimodal Diffusion Transformer (MMDiT) text-to-image model that features improved performance in image quality, typography, complex prompt understanding, and 
resourc","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/stable-video","name":"High Quality Stable Video Diffusion","created_by":"fal","source":"official","description":"Generate short video clips from your images using SVD v1.1","status":"active","release_date":"2024-09-16","model_type":"video","page_url":"https://fal.run/fal-ai/stable-video","tagline":"Generate short video clips from your images using SVD v1.1","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/star-vector","name":"StarVector","created_by":"fal","source":"official","description":"AI vectorization model that transforms raster images into scalable SVG graphics, preserving visual details while enabling infinite scaling and easy editing capabilities.","status":"active","release_date":"2025-04-01","model_type":"image","page_url":"https://fal.run/fal-ai/star-vector","tagline":"AI vectorization model that transforms raster images into scalable SVG graphics, preserving visual details while enabling infinite scaling and easy editing capabilities.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/step1x-edit","name":"Step1X Edit","created_by":"fal","source":"official","description":"Step1X-Edit transforms your photos with simple instructions into stunning, professional-quality edits—rivaling top proprietary tools.","status":"active","release_date":"2025-04-25","model_type":"image","page_url":"https://fal.run/fal-ai/step1x-edit","tagline":"Step1X-Edit transforms your photos with simple instructions into stunning, professional-quality edits—rivaling top proprietary 
tools.","capabilities":{"vision":true,"tool_call":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"tools":["function_calling"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/stepx-edit2","name":"Stepx Edit2","created_by":"fal","source":"official","description":"Image-to-image editing with Step1X-Edit v2 from StepFun.","status":"active","release_date":"2025-12-09","model_type":"image","page_url":"https://fal.run/fal-ai/stepx-edit2","tagline":"Image-to-image editing with Step1X-Edit v2 from StepFun.","capabilities":{"vision":true,"reasoning":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/swin2sr","name":"SWIN2SR","created_by":"fal","source":"official","description":"Enhance low-resolution images with the superior quality of Swin2SR for sharper, clearer results.","status":"active","release_date":"2025-02-28","model_type":"image","page_url":"https://fal.run/fal-ai/swin2sr","tagline":"Enhance low-resolution images with the superior quality of Swin2SR for sharper, clearer results.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/switti/512","name":"Switti 512","created_by":"fal","source":"official","description":"Switti is a scale-wise transformer for fast text-to-image generation that outperforms existing T2I AR models and competes with state-of-the-art T2I diffusion models while being faster than distilled d","status":"active","release_date":"2024-12-31","model_type":"image","page_url":"https://fal.run/fal-ai/switti/512","tagline":"Switti is a scale-wise transformer for fast text-to-image generation that outperforms existing T2I AR models and competes with state-of-the-art T2I diffusion models while being faster than distilled 
d","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/switti","name":"Switti 1024","created_by":"fal","source":"official","description":"Switti is a scale-wise transformer for fast text-to-image generation that outperforms existing T2I AR models and competes with state-of-the-art T2I diffusion models while being faster than distilled d","status":"active","release_date":"2024-12-31","model_type":"image","page_url":"https://fal.run/fal-ai/switti","tagline":"Switti is a scale-wise transformer for fast text-to-image generation that outperforms existing T2I AR models and competes with state-of-the-art T2I diffusion models while being faster than distilled d","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/sync-lipsync/react-1","name":"Sync React-1","created_by":"fal","source":"official","description":"Use React-1 from SyncLabs to refine human emotions and do realistic lip-sync without losing details!","status":"active","release_date":"2025-12-10","model_type":"other","page_url":"https://fal.run/fal-ai/sync-lipsync/react-1","tagline":"Use React-1 from SyncLabs to refine human emotions and do realistic lip-sync without losing details!","last_seen_at":"2026-04-30","last_updated":"2026-05-11"},{"id":"fal-ai/sync-lipsync/v2/pro","name":"Sync Lipsync","created_by":"fal","source":"official","description":"Generate high-quality realistic lipsync animations from audio while preserving unique details like natural teeth and unique facial features using the state-of-the-art Sync Lipsync 2 Pro model.","status":"active","release_date":"2025-09-02","model_type":"other","page_url":"https://fal.run/fal-ai/sync-lipsync/v2/pro","tagline":"Generate high-quality realistic lipsync animations from audio while preserving unique details like 
natural teeth and unique facial features using the state-of-the-art Sync Lipsync 2 Pro model.","last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/sync-lipsync/v2","name":"Sync Lipsync 2.0","created_by":"fal","source":"official","description":"Generate realistic lipsync animations from audio using advanced algorithms for high-quality synchronization with Sync Lipsync 2.0 model","status":"active","release_date":"2025-04-01","model_type":"other","page_url":"https://fal.run/fal-ai/sync-lipsync/v2","tagline":"Generate realistic lipsync animations from audio using advanced algorithms for high-quality synchronization with Sync Lipsync 2.0 model","last_seen_at":"2026-06-26","last_updated":"2026-06-29"},{"id":"fal-ai/sync-lipsync/v3/image-to-video","name":"sync-3 Avatar Image to Video","created_by":"fal","source":"official","description":"sync-3 image to video turns a single still into a talking character, and works with any illustration or animated frame paired with a voice track","status":"active","release_date":"2026-06-22","model_type":"video","page_url":"https://fal.run/fal-ai/sync-lipsync/v3/image-to-video","tagline":"sync-3 image to video turns a single still into a talking character, and works with any illustration or animated frame paired with a voice track","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-23","last_updated":"2026-06-29"},{"id":"fal-ai/sync-lipsync/v3","name":"sync-3 Lipsync","created_by":"fal","source":"official","description":"sync-3 most powerful lipsync model yet, featuring native visual intelligence for professional-quality video.","status":"active","release_date":"2026-04-06","model_type":"other","page_url":"https://fal.run/fal-ai/sync-lipsync/v3","tagline":"sync-3 most powerful lipsync model yet, featuring native visual intelligence for professional-quality 
video.","last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/sync-lipsync","name":"sync.so -- lipsync 1.9.0-beta","created_by":"fal","source":"official","description":"Generate realistic lipsync animations from audio using advanced algorithms for high-quality synchronization.","status":"active","release_date":"2025-01-13","model_type":"other","page_url":"https://fal.run/fal-ai/sync-lipsync","tagline":"Generate realistic lipsync animations from audio using advanced algorithms for high-quality synchronization.","last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/t2v-turbo","name":"T2V Turbo - Video Crafter","created_by":"fal","source":"official","description":"Generate short video clips from your prompts","status":"active","release_date":"2024-03-08","model_type":"video","page_url":"https://fal.run/fal-ai/t2v-turbo","tagline":"Generate short video clips from your prompts","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/tada/1b/text-to-speech","name":"Tada TTS 1B","created_by":"fal","source":"official","description":"A unified speech-language model that synchronizes speech and text into a single, cohesive stream via 1:1 alignment.","status":"active","release_date":"2026-03-12","model_type":"other","page_url":"https://fal.run/fal-ai/tada/1b/text-to-speech","tagline":"A unified speech-language model that synchronizes speech and text into a single, cohesive stream via 1:1 alignment.","last_seen_at":"2026-03-12","last_updated":"2026-05-11"},{"id":"fal-ai/tada/3b/text-to-speech","name":"Tada","created_by":"fal","source":"official","description":"A unified speech-language model that synchronizes speech and text into a single, cohesive stream via 1:1 alignment.","status":"active","release_date":"2026-03-12","model_type":"other","page_url":"https://fal.run/fal-ai/tada/3b/text-to-speech","tagline":"A unified speech-language model that 
synchronizes speech and text into a single, cohesive stream via 1:1 alignment.","last_seen_at":"2026-03-12","last_updated":"2026-05-11"},{"id":"fal-ai/telestyle-v2","name":"Telestyle V2 Style Transfer","created_by":"fal","source":"official","description":"Restyle any image with TeleStyle v2 — provide an original image and a styling reference, and the model re-renders the original in the reference's visual style while preserving its content and composit","status":"active","release_date":"2026-06-22","model_type":"image","page_url":"https://fal.run/fal-ai/telestyle-v2","tagline":"Restyle any image with TeleStyle v2 — provide an original image and a styling reference, and the model re-renders the original in the reference's visual style while preserving its content and composit","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/thera","name":"Thera","created_by":"fal","source":"official","description":"Fix low resolution images with fast speed and quality of thera.","status":"active","release_date":"2025-03-24","model_type":"image","page_url":"https://fal.run/fal-ai/thera","tagline":"Fix low resolution images with fast speed and quality of thera.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/thinksound/audio","name":"ThinkSound","created_by":"fal","source":"official","description":"Generate realistic audio from a video with an optional text prompt","status":"active","release_date":"2025-07-02","model_type":"other","page_url":"https://fal.run/fal-ai/thinksound/audio","tagline":"Generate realistic audio from a video with an optional text 
prompt","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/thinksound","name":"ThinkSound","created_by":"fal","source":"official","description":"Generate realistic audio for a video with an optional text prompt and combine","status":"active","release_date":"2025-07-01","model_type":"other","page_url":"https://fal.run/fal-ai/thinksound","tagline":"Generate realistic audio for a video with an optional text prompt and combine","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/topaz/upscale/image","name":"Topaz","created_by":"fal","source":"official","description":"Use the powerful and accurate topaz image enhancer to enhance your images.","status":"active","release_date":"2025-06-27","model_type":"image","page_url":"https://fal.run/fal-ai/topaz/upscale/image","tagline":"Use the powerful and accurate topaz image enhancer to enhance your images.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-05-26","last_updated":"2026-06-03"},{"id":"fal-ai/topaz/upscale/video","name":"Topaz Video Upscale","created_by":"fal","source":"official","description":"Professional-grade video upscaling using Topaz technology.","status":"active","release_date":"2025-03-04","model_type":"other","page_url":"https://fal.run/fal-ai/topaz/upscale/video","tagline":"Professional-grade video upscaling using Topaz technology.","last_seen_at":"2026-05-26","last_updated":"2026-06-03"},{"id":"fal-ai/transpixar","name":"TransPixar V1","created_by":"fal","source":"official","description":"Transform text into stunning videos with TransPixar - an AI model that generates both RGB footage and alpha channels, enabling seamless compositing and creative video effects.","status":"active","release_date":"2025-01-14","model_type":"video","page_url":"https://fal.run/fal-ai/transpixar","tagline":"Transform text into stunning videos with TransPixar - an AI model that generates both RGB footage 
and alpha channels, enabling seamless compositing and creative video effects.","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/trellis-2/retexture","name":"Trellis 2","created_by":"fal","source":"official","description":"Generate 3D models from your images using Trellis 2.","status":"active","release_date":"2026-03-02","model_type":"other","page_url":"https://fal.run/fal-ai/trellis-2/retexture","tagline":"Generate 3D models from your images using Trellis 2.","capabilities":{"vision":true},"last_seen_at":"2026-03-02","last_updated":"2026-05-11"},{"id":"fal-ai/trellis-2","name":"Trellis 2","created_by":"fal","source":"official","description":"Generate 3D models from your images using Trellis 2.","status":"active","release_date":"2025-12-17","model_type":"other","page_url":"https://fal.run/fal-ai/trellis-2","tagline":"Generate 3D models from your images using Trellis 2.","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/trellis/multi","name":"Trellis","created_by":"fal","source":"official","description":"Generate 3D models from multiple images using Trellis.","status":"active","release_date":"2025-05-02","model_type":"other","page_url":"https://fal.run/fal-ai/trellis/multi","tagline":"Generate 3D models from multiple images using Trellis.","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/trellis","name":"Trellis","created_by":"fal","source":"official","description":"Generate 3D models from your images using Trellis.","status":"active","release_date":"2024-12-13","model_type":"other","page_url":"https://fal.run/fal-ai/trellis","tagline":"Generate 3D models from your images using 
Trellis.","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/triposr","name":"TripoSR","created_by":"fal","source":"official","description":"State of the art Image to 3D Object generation","status":"active","release_date":"2024-01-30","model_type":"other","page_url":"https://fal.run/fal-ai/triposr","tagline":"State of the art Image to 3D Object generation","capabilities":{"vision":true},"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/turbo-flux-trainer","name":"Turbo Flux Trainer","created_by":"fal","source":"official","description":"A blazing fast FLUX dev LoRA trainer for subjects and styles.","status":"active","release_date":"2025-04-17","model_type":"other","page_url":"https://fal.run/fal-ai/turbo-flux-trainer","tagline":"A blazing fast FLUX dev LoRA trainer for subjects and styles.","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/ultrashape","name":"Ultrashape","created_by":"fal","source":"official","description":"UltraShape-1.0 is a 3D diffusion framework that generates high-fidelity 3D geometry through coarse-to-fine geometric refinement.","status":"active","release_date":"2026-01-06","model_type":"other","page_url":"https://fal.run/fal-ai/ultrashape","tagline":"UltraShape-1.0 is a 3D diffusion framework that generates high-fidelity 3D geometry through coarse-to-fine geometric refinement.","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/uno","name":"Uno","created_by":"fal","source":"official","description":"An AI model that transforms input images into new ones based on text prompts, blending reference visuals with your creative directions.","status":"active","release_date":"2025-04-24","model_type":"image","page_url":"https://fal.run/fal-ai/uno","tagline":"An AI model that transforms input images into new ones based on text prompts, blending reference visuals with your creative 
directions.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/uso","name":"Uso","created_by":"fal","source":"official","description":"Use USO to perform subject driven generations using reference image.","status":"active","release_date":"2025-08-30","model_type":"image","page_url":"https://fal.run/fal-ai/uso","tagline":"Use USO to perform subject driven generations using reference image.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/vecglypher/image-to-svg","name":"Vecglypher","created_by":"fal","source":"official","description":"Vector font generation with VecGlypher.","status":"active","release_date":"2026-03-10","model_type":"image","page_url":"https://fal.run/fal-ai/vecglypher/image-to-svg","tagline":"Vector font generation with VecGlypher.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-03-10","last_updated":"2026-05-11"},{"id":"fal-ai/vecglypher","name":"Vecglypher","created_by":"fal","source":"official","description":"Vector font generation with VecGlypher.","status":"active","release_date":"2026-03-10","model_type":"image","page_url":"https://fal.run/fal-ai/vecglypher","tagline":"Vector font generation with VecGlypher.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-03-10","last_updated":"2026-05-11"},{"id":"fal-ai/veo2/image-to-video","name":"Veo 2 (Image to Video)","created_by":"fal","source":"official","description":"Veo 2 creates videos from images with realistic motion and very high quality 
output.","status":"active","release_date":"2025-03-11","model_type":"video","page_url":"https://fal.run/fal-ai/veo2/image-to-video","tagline":"Veo 2 creates videos from images with realistic motion and very high quality output.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-28","last_updated":"2026-05-11"},{"id":"fal-ai/veo2","name":"Veo 2","created_by":"fal","source":"official","description":"Veo 2 creates videos with realistic motion and high quality output.","status":"active","release_date":"2025-02-21","model_type":"video","page_url":"https://fal.run/fal-ai/veo2","tagline":"Veo 2 creates videos with realistic motion and high quality output.","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-28","last_updated":"2026-05-11"},{"id":"fal-ai/veo3/fast/image-to-video","name":"Veo 3 Fast [Image to Video]","created_by":"fal","source":"official","description":"Now with a 50% price drop.","status":"active","release_date":"2025-07-09","model_type":"video","page_url":"https://fal.run/fal-ai/veo3/fast/image-to-video","tagline":"Now with a 50% price drop.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-28","last_updated":"2026-05-11"},{"id":"fal-ai/veo3/fast","name":"Veo 3 Fast","created_by":"fal","source":"official","description":"Faster and more cost effective version of Google's Veo 3! ","status":"active","release_date":"2025-07-09","model_type":"video","page_url":"https://fal.run/fal-ai/veo3/fast","tagline":"Faster and more cost effective version of Google's Veo 3! 
","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-28","last_updated":"2026-05-11"},{"id":"fal-ai/veo3/image-to-video","name":"Veo3","created_by":"fal","source":"official","description":"Veo 3 is the latest state-of-the art video generation model from Google DeepMind","status":"active","release_date":"2025-08-01","model_type":"video","page_url":"https://fal.run/fal-ai/veo3/image-to-video","tagline":"Veo 3 is the latest state-of-the art video generation model from Google DeepMind","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-28","last_updated":"2026-05-11"},{"id":"fal-ai/veo3.1/extend-video","name":"Veo 3.1","created_by":"fal","source":"official","description":"Extend Veo-Created Videos up to 30 seconds","status":"active","release_date":"2025-12-15","model_type":"other","page_url":"https://fal.run/fal-ai/veo3.1/extend-video","tagline":"Extend Veo-Created Videos up to 30 seconds","last_seen_at":"2026-04-28","last_updated":"2026-05-11"},{"id":"fal-ai/veo3.1/fast/extend-video","name":"Veo 3.1 Fast","created_by":"fal","source":"official","description":"Extend Veo-Created Videos up to 30 seconds","status":"active","release_date":"2025-12-15","model_type":"other","page_url":"https://fal.run/fal-ai/veo3.1/fast/extend-video","tagline":"Extend Veo-Created Videos up to 30 seconds","last_seen_at":"2026-04-28","last_updated":"2026-05-11"},{"id":"fal-ai/veo3.1/fast/first-last-frame-to-video","name":"Veo 3.1 Fast","created_by":"fal","source":"official","description":"Generate videos from a first/last frame using Google's Veo 3.1 Fast","status":"active","release_date":"2025-10-08","model_type":"video","page_url":"https://fal.run/fal-ai/veo3.1/fast/first-last-frame-to-video","tagline":"Generate videos from a first/last frame using Google's Veo 3.1 
Fast","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-28","last_updated":"2026-05-11"},{"id":"fal-ai/veo3.1/fast/image-to-video","name":"Veo 3.1 Fast","created_by":"fal","source":"official","description":"Generate videos from your image prompts using Veo 3.1 fast.","status":"active","release_date":"2025-10-08","model_type":"video","page_url":"https://fal.run/fal-ai/veo3.1/fast/image-to-video","tagline":"Generate videos from your image prompts using Veo 3.1 fast.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-28","last_updated":"2026-05-11"},{"id":"fal-ai/veo3.1/fast/reference-to-video","name":"Veo 3.1 Fast","created_by":"fal","source":"official","description":"Generate videos from reference images using Google's Veo 3.1 Fast","status":"active","release_date":"2025-10-08","model_type":"video","page_url":"https://fal.run/fal-ai/veo3.1/fast/reference-to-video","tagline":"Generate videos from reference images using Google's Veo 3.1 Fast","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-05-11","last_updated":"2026-06-03"},{"id":"fal-ai/veo3.1/fast","name":"Veo 3.1 Fast","created_by":"fal","source":"official","description":"Faster and more cost effective version of Google's Veo 3.1! ","status":"active","release_date":"2025-10-08","model_type":"video","page_url":"https://fal.run/fal-ai/veo3.1/fast","tagline":"Faster and more cost effective version of Google's Veo 3.1! 
","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-28","last_updated":"2026-05-11"},{"id":"fal-ai/veo3.1/first-last-frame-to-video","name":"Veo 3.1","created_by":"fal","source":"official","description":"Generate videos from a first and last framed using Google's Veo 3.1","status":"active","release_date":"2025-10-08","model_type":"video","page_url":"https://fal.run/fal-ai/veo3.1/first-last-frame-to-video","tagline":"Generate videos from a first and last framed using Google's Veo 3.1","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-28","last_updated":"2026-05-11"},{"id":"fal-ai/veo3.1/image-to-video","name":"Veo 3.1","created_by":"fal","source":"official","description":"Veo 3.1 is the latest state-of-the art video generation model from Google DeepMind","status":"active","release_date":"2025-10-08","model_type":"video","page_url":"https://fal.run/fal-ai/veo3.1/image-to-video","tagline":"Veo 3.1 is the latest state-of-the art video generation model from Google DeepMind","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-28","last_updated":"2026-05-11"},{"id":"fal-ai/veo3.1/lite/first-last-frame-to-video","name":"Veo3.1 Lite FLF","created_by":"fal","source":"official","description":"Veo 3.1 Lite balances practical utility with professional capabilities, supporting Text-to-Video and Image-to-Video","status":"active","release_date":"2026-03-31","model_type":"video","page_url":"https://fal.run/fal-ai/veo3.1/lite/first-last-frame-to-video","tagline":"Veo 3.1 Lite balances practical utility with professional capabilities, supporting Text-to-Video and 
Image-to-Video","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-28","last_updated":"2026-05-11"},{"id":"fal-ai/veo3.1/lite/image-to-video","name":"Veo3.1 Lite Image to Video","created_by":"fal","source":"official","description":"Veo 3.1 Lite balances practical utility with professional capabilities, supporting Text-to-Video and Image-to-Video","status":"active","release_date":"2026-03-31","model_type":"video","page_url":"https://fal.run/fal-ai/veo3.1/lite/image-to-video","tagline":"Veo 3.1 Lite balances practical utility with professional capabilities, supporting Text-to-Video and Image-to-Video","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-28","last_updated":"2026-05-11"},{"id":"fal-ai/veo3.1/lite","name":"Veo3.1 Lite Text to Video","created_by":"fal","source":"official","description":"Veo 3.1 Lite balances practical utility with professional capabilities, supporting Text-to-Video and Image-to-Video","status":"active","release_date":"2026-03-31","model_type":"video","page_url":"https://fal.run/fal-ai/veo3.1/lite","tagline":"Veo 3.1 Lite balances practical utility with professional capabilities, supporting Text-to-Video and Image-to-Video","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-28","last_updated":"2026-05-11"},{"id":"fal-ai/veo3.1/reference-to-video","name":"Veo 3.1","created_by":"fal","source":"official","description":"Generate Videos from images using Google's Veo 3.1","status":"active","release_date":"2025-10-08","model_type":"video","page_url":"https://fal.run/fal-ai/veo3.1/reference-to-video","tagline":"Generate Videos from images using Google's Veo 
3.1","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-28","last_updated":"2026-05-11"},{"id":"fal-ai/veo3.1","name":"Veo 3.1","created_by":"fal","source":"official","description":"Veo 3.1 by Google, the most advanced AI video generation model in the world.","status":"active","release_date":"2025-10-08","model_type":"video","page_url":"https://fal.run/fal-ai/veo3.1","tagline":"Veo 3.1 by Google, the most advanced AI video generation model in the world.","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-28","last_updated":"2026-05-11"},{"id":"fal-ai/veo3","name":"Veo 3","created_by":"fal","source":"official","description":"Veo 3 by Google, the most advanced AI video generation model in the world.","status":"active","release_date":"2025-06-05","model_type":"video","page_url":"https://fal.run/fal-ai/veo3","tagline":"Veo 3 by Google, the most advanced AI video generation model in the world.","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-28","last_updated":"2026-05-11"},{"id":"fal-ai/vibevoice/0.5b","name":"Vibevoice","created_by":"fal","source":"official","description":"Generate long speech snippets fast using Microsoft's powerful TTS.","status":"active","release_date":"2025-12-17","model_type":"tts","page_url":"https://fal.run/fal-ai/vibevoice/0.5b","tagline":"Generate long speech snippets fast using Microsoft's powerful TTS.","modalities":{"input":["text"],"output":["audio"]},"endpoints":["audio_speech"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/vibevoice/7b","name":"VibeVoice 7B","created_by":"fal","source":"official","description":"Generate long, expressive multi-voice speech using Microsoft's powerful TTS","status":"active","release_date":"2025-08-27","model_type":"tts","page_url":"https://fal.run/fal-ai/vibevoice/7b","tagline":"Generate long, expressive 
multi-voice speech using Microsoft's powerful TTS","modalities":{"input":["text"],"output":["audio"]},"endpoints":["audio_speech"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/vibevoice","name":"VibeVoice 1.5B","created_by":"fal","source":"official","description":"Generate long, expressive multi-voice speech using Microsoft's powerful TTS","status":"active","release_date":"2025-08-27","model_type":"tts","page_url":"https://fal.run/fal-ai/vibevoice","tagline":"Generate long, expressive multi-voice speech using Microsoft's powerful TTS","modalities":{"input":["text"],"output":["audio"]},"endpoints":["audio_speech"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/video-as-prompt","name":"Video As Prompt","created_by":"fal","source":"official","description":"A model for unified semantic control in video generation.","status":"active","release_date":"2025-10-29","model_type":"other","page_url":"https://fal.run/fal-ai/video-as-prompt","tagline":"A model for unified semantic control in video generation.","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/video-prompt-generator","name":"Video Prompt Generator","created_by":"fal","source":"official","description":"Generate video prompts using a variety of techniques including camera direction, style, pacing, special effects and more.","status":"active","release_date":"2025-02-25","model_type":"other","page_url":"https://fal.run/fal-ai/video-prompt-generator","tagline":"Generate video prompts using a variety of techniques including camera direction, style, pacing, special effects and more.","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/video-understanding","name":"Video Understanding","created_by":"fal","source":"official","description":"A video understanding model to analyze video content and answer questions about what's happening in the video based on user 
prompts.","status":"active","release_date":"2025-06-20","model_type":"other","page_url":"https://fal.run/fal-ai/video-understanding","tagline":"A video understanding model to analyze video content and answer questions about what's happening in the video based on user prompts.","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/video-upscaler","name":"Video Upscaler","created_by":"fal","source":"official","description":"The video upscaler endpoint uses RealESRGAN on each frame of the input video to upscale the video to a higher resolution.","status":"active","release_date":"2024-12-04","model_type":"other","page_url":"https://fal.run/fal-ai/video-upscaler","tagline":"The video upscaler endpoint uses RealESRGAN on each frame of the input video to upscale the video to a higher resolution.","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/vidu/image-to-video","name":"Vidu Image to Video","created_by":"fal","source":"official","description":"Vidu Image to Video generates high-quality videos with exceptional visual quality and motion diversity from a single image","status":"active","release_date":"2025-03-12","model_type":"video","page_url":"https://fal.run/fal-ai/vidu/image-to-video","tagline":"Vidu Image to Video generates high-quality videos with exceptional visual quality and motion diversity from a single image","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-27","last_updated":"2026-05-11"},{"id":"fal-ai/vidu/q1/image-to-video","name":"Vidu Image to Video","created_by":"fal","source":"official","description":"Vidu Q1 Image to Video generates high-quality 1080p videos with exceptional visual quality and motion diversity from a single image","status":"active","release_date":"2025-05-09","model_type":"video","page_url":"https://fal.run/fal-ai/vidu/q1/image-to-video","tagline":"Vidu Q1 Image to Video generates 
high-quality 1080p videos with exceptional visual quality and motion diversity from a single image","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-27","last_updated":"2026-05-11"},{"id":"fal-ai/vidu/q1/reference-to-video","name":"Vidu","created_by":"fal","source":"official","description":"Generate video clips from your multiple image references using Vidu Q1","status":"active","release_date":"2025-07-08","model_type":"video","page_url":"https://fal.run/fal-ai/vidu/q1/reference-to-video","tagline":"Generate video clips from your multiple image references using Vidu Q1","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-27","last_updated":"2026-05-11"},{"id":"fal-ai/vidu/q1/start-end-to-video","name":"Vidu Start End to Video","created_by":"fal","source":"official","description":"Vidu Q1 Start-End to Video generates smooth transition 1080p videos between specified start and end images.","status":"active","release_date":"2025-05-09","model_type":"video","page_url":"https://fal.run/fal-ai/vidu/q1/start-end-to-video","tagline":"Vidu Q1 Start-End to Video generates smooth transition 1080p videos between specified start and end images.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-27","last_updated":"2026-05-11"},{"id":"fal-ai/vidu/q1/text-to-video","name":"Vidu Text to Video","created_by":"fal","source":"official","description":"Vidu Q1 Text to Video generates high-quality 1080p videos with exceptional visual quality and motion diversity","status":"active","release_date":"2025-05-09","model_type":"video","page_url":"https://fal.run/fal-ai/vidu/q1/text-to-video","tagline":"Vidu Q1 Text to Video generates high-quality 1080p videos with exceptional visual quality and motion 
diversity","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-27","last_updated":"2026-05-11"},{"id":"fal-ai/vidu/q2/image-to-video/pro","name":"Vidu","created_by":"fal","source":"official","description":"Use the latest Vidu Q2 models which much more better quality and control on your videos.","status":"active","release_date":"2025-10-24","model_type":"video","page_url":"https://fal.run/fal-ai/vidu/q2/image-to-video/pro","tagline":"Use the latest Vidu Q2 models which much more better quality and control on your videos.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-27","last_updated":"2026-05-11"},{"id":"fal-ai/vidu/q2/image-to-video/turbo","name":"Vidu","created_by":"fal","source":"official","description":"Use the latest Vidu Q2 models which much more better quality and control on your videos.","status":"active","release_date":"2025-10-24","model_type":"video","page_url":"https://fal.run/fal-ai/vidu/q2/image-to-video/turbo","tagline":"Use the latest Vidu Q2 models which much more better quality and control on your videos.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-27","last_updated":"2026-05-11"},{"id":"fal-ai/vidu/q2/reference-to-image","name":"Vidu","created_by":"fal","source":"official","description":"Vidu Reference-to-Image creates images by using a reference images and combining them with a prompt.","status":"active","release_date":"2025-12-02","model_type":"image","page_url":"https://fal.run/fal-ai/vidu/q2/reference-to-image","tagline":"Vidu Reference-to-Image creates images by using a reference images and combining them with a 
prompt.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-27","last_updated":"2026-05-11"},{"id":"fal-ai/vidu/q2/reference-to-video/pro","name":"Vidu","created_by":"fal","source":"official","description":"Use the latest Vidu Q2 Pro models which much more better quality and control on your videos.","status":"active","release_date":"2026-01-19","model_type":"video","page_url":"https://fal.run/fal-ai/vidu/q2/reference-to-video/pro","tagline":"Use the latest Vidu Q2 Pro models which much more better quality and control on your videos.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-27","last_updated":"2026-05-11"},{"id":"fal-ai/vidu/q2/text-to-image","name":"Vidu","created_by":"fal","source":"official","description":"Use vidu Text-to-Image to turn your prompts into reality.","status":"active","release_date":"2025-12-02","model_type":"image","page_url":"https://fal.run/fal-ai/vidu/q2/text-to-image","tagline":"Use vidu Text-to-Image to turn your prompts into reality.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-27","last_updated":"2026-05-11"},{"id":"fal-ai/vidu/q2/text-to-video","name":"Vidu","created_by":"fal","source":"official","description":"Use the latest Vidu Q2 models which much more better quality and control on your videos.","status":"active","release_date":"2025-10-22","model_type":"video","page_url":"https://fal.run/fal-ai/vidu/q2/text-to-video","tagline":"Use the latest Vidu Q2 models which much more better quality and control on your videos.","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-27","last_updated":"2026-05-11"},{"id":"fal-ai/vidu/q2/video-extension/pro","name":"Vidu","created_by":"fal","source":"official","description":"Use the latest Vidu 
Q2 models which much more better quality and control on your videos.","status":"active","release_date":"2025-10-24","model_type":"other","page_url":"https://fal.run/fal-ai/vidu/q2/video-extension/pro","tagline":"Use the latest Vidu Q2 models which much more better quality and control on your videos.","last_seen_at":"2026-04-27","last_updated":"2026-05-11"},{"id":"fal-ai/vidu/q3/image-to-video/turbo","name":"Vidu","created_by":"fal","source":"official","description":"Vidu's Q3 Turbo Model","status":"active","release_date":"2026-02-06","model_type":"video","page_url":"https://fal.run/fal-ai/vidu/q3/image-to-video/turbo","tagline":"Vidu's Q3 Turbo Model","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/vidu/q3/image-to-video","name":"Vidu","created_by":"fal","source":"official","description":"Vidu's latest Q3 pro models.","status":"active","release_date":"2026-01-31","model_type":"video","page_url":"https://fal.run/fal-ai/vidu/q3/image-to-video","tagline":"Vidu's latest Q3 pro models.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/vidu/q3/reference-to-video/mix","name":"Vidu","created_by":"fal","source":"official","description":"Vidu's latest Q3 Reference to Video Mix model","status":"active","release_date":"2026-04-08","model_type":"video","page_url":"https://fal.run/fal-ai/vidu/q3/reference-to-video/mix","tagline":"Vidu's latest Q3 Reference to Video Mix model","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/vidu/q3/text-to-video/turbo","name":"Vidu","created_by":"fal","source":"official","description":"Vidu's Q3 Turbo 
Model.","status":"active","release_date":"2026-02-06","model_type":"video","page_url":"https://fal.run/fal-ai/vidu/q3/text-to-video/turbo","tagline":"Vidu's Q3 Turbo Model.","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/vidu/q3/text-to-video","name":"Vidu","created_by":"fal","source":"official","description":"Vidu's latest Q3 pro models","status":"active","release_date":"2026-01-31","model_type":"video","page_url":"https://fal.run/fal-ai/vidu/q3/text-to-video","tagline":"Vidu's latest Q3 pro models","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/vidu/reference-to-image","name":"Vidu","created_by":"fal","source":"official","description":"Vidu Reference-to-Image creates images by using a reference images and combining them with a prompt.","status":"active","release_date":"2025-09-09","model_type":"image","page_url":"https://fal.run/fal-ai/vidu/reference-to-image","tagline":"Vidu Reference-to-Image creates images by using a reference images and combining them with a prompt.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-27","last_updated":"2026-05-11"},{"id":"fal-ai/vidu/reference-to-video","name":"Vidu Reference to Video","created_by":"fal","source":"official","description":"Vidu Reference to Video creates videos by using a reference images and combining them with a prompt.","status":"active","release_date":"2025-03-12","model_type":"video","page_url":"https://fal.run/fal-ai/vidu/reference-to-video","tagline":"Vidu Reference to Video creates videos by using a reference images and combining them with a 
prompt.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-27","last_updated":"2026-05-11"},{"id":"fal-ai/vidu/start-end-to-video","name":"Vidu Start-End to Video","created_by":"fal","source":"official","description":"Vidu Start-End to Video generates smooth transition videos between specified start and end images.","status":"active","release_date":"2025-03-12","model_type":"video","page_url":"https://fal.run/fal-ai/vidu/start-end-to-video","tagline":"Vidu Start-End to Video generates smooth transition videos between specified start and end images.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-27","last_updated":"2026-05-11"},{"id":"fal-ai/vidu/template-to-video","name":"Vidu Template to Video","created_by":"fal","source":"official","description":"Vidu Template to Video lets you create different effects by applying motion templates to your images.","status":"active","release_date":"2025-03-12","model_type":"video","page_url":"https://fal.run/fal-ai/vidu/template-to-video","tagline":"Vidu Template to Video lets you create different effects by applying motion templates to your images.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-27","last_updated":"2026-05-11"},{"id":"fal-ai/void-video-inpainting","name":"Void Video Inpainting","created_by":"fal","source":"official","description":"VOID removes objects from videos along with all interactions they induce on the scene","status":"active","release_date":"2026-04-10","model_type":"other","page_url":"https://fal.run/fal-ai/void-video-inpainting","tagline":"VOID removes objects from videos along with all interactions they induce on the scene","last_seen_at":"2026-04-28","last_updated":"2026-05-11"},{"id":"fal-ai/wan-22-image-trainer","name":"Wan 2.2 14B Image 
Trainer","created_by":"fal","source":"official","family":"wan","description":"Wan 2.2 text to image LoRA trainer.","status":"active","release_date":"2025-08-11","model_type":"other","page_url":"https://fal.run/fal-ai/wan-22-image-trainer","tagline":"Wan 2.2 text to image LoRA trainer.","capabilities":{"vision":true},"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/wan-22-trainer/i2v-a14b","name":"Wan-2.2 LoRA Trainer","created_by":"fal","source":"official","family":"wan","description":"Train custom LoRAs for Wan-2.2 T2V/I2V 480P","status":"active","release_date":"2026-02-23","model_type":"other","page_url":"https://fal.run/fal-ai/wan-22-trainer/i2v-a14b","tagline":"Train custom LoRAs for Wan-2.2 T2V/I2V 480P","last_seen_at":"2026-02-25","last_updated":"2026-05-11"},{"id":"fal-ai/wan-22-trainer/t2v-a14b","name":"Wan-2.2 LoRA Trainer","created_by":"fal","source":"official","family":"wan","description":"Train custom LoRAs for Wan-2.2 T2V/I2V 480P","status":"active","release_date":"2026-02-23","model_type":"other","page_url":"https://fal.run/fal-ai/wan-22-trainer/t2v-a14b","tagline":"Train custom LoRAs for Wan-2.2 T2V/I2V 480P","last_seen_at":"2026-02-25","last_updated":"2026-05-11"},{"id":"fal-ai/wan-22-vace-fun-a14b/depth","name":"Wan 2.2 VACE Fun A14B","created_by":"fal","source":"official","family":"wan","description":"VACE Fun for Wan 2.2 A14B from Alibaba-PAI","status":"active","release_date":"2025-09-17","model_type":"other","page_url":"https://fal.run/fal-ai/wan-22-vace-fun-a14b/depth","tagline":"VACE Fun for Wan 2.2 A14B from Alibaba-PAI","last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/wan-22-vace-fun-a14b/inpainting","name":"Wan 2.2 VACE Fun A14B","created_by":"fal","source":"official","family":"wan","description":"VACE Fun for Wan 2.2 A14B from Alibaba-PAI","status":"active","release_date":"2025-09-17","model_type":"other","page_url":"https://fal.run/fal-ai/wan-22-vace-fun-a14b/inpainting","tagline":"VACE Fun for 
Wan 2.2 A14B from Alibaba-PAI","last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/wan-22-vace-fun-a14b/outpainting","name":"Wan 2.2 VACE Fun A14B","created_by":"fal","source":"official","family":"wan","description":"VACE Fun for Wan 2.2 A14B from Alibaba-PAI","status":"active","release_date":"2025-09-17","model_type":"other","page_url":"https://fal.run/fal-ai/wan-22-vace-fun-a14b/outpainting","tagline":"VACE Fun for Wan 2.2 A14B from Alibaba-PAI","last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/wan-22-vace-fun-a14b/reframe","name":"Wan 2.2 VACE Fun A14B","created_by":"fal","source":"official","family":"wan","description":"VACE Fun for Wan 2.2 A14B from Alibaba-PAI","status":"active","release_date":"2025-09-17","model_type":"other","page_url":"https://fal.run/fal-ai/wan-22-vace-fun-a14b/reframe","tagline":"VACE Fun for Wan 2.2 A14B from Alibaba-PAI","last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/wan-25-preview/image-to-image","name":"Wan 2.5 Image to Image","created_by":"fal","source":"official","family":"wan","description":"Wan 2.5 image-to-image model.","status":"active","release_date":"2025-09-25","model_type":"image","page_url":"https://fal.run/fal-ai/wan-25-preview/image-to-image","tagline":"Wan 2.5 image-to-image model.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/wan-25-preview/image-to-video","name":"Wan 2.5 Image to Video","created_by":"fal","source":"official","family":"wan","description":"Wan 2.5 image-to-video model.","status":"active","release_date":"2025-09-24","model_type":"video","page_url":"https://fal.run/fal-ai/wan-25-preview/image-to-video","tagline":"Wan 2.5 image-to-video 
model.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/wan-25-preview/text-to-image","name":"Wan 2.5 Text to Image","created_by":"fal","source":"official","family":"wan","description":"Wan 2.5 text-to-image model.","status":"active","release_date":"2025-09-25","model_type":"image","page_url":"https://fal.run/fal-ai/wan-25-preview/text-to-image","tagline":"Wan 2.5 text-to-image model.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/wan-25-preview/text-to-video","name":"Wan 2.5 Text to Video","created_by":"fal","source":"official","family":"wan","description":"Wan 2.5 text-to-video model.","status":"active","release_date":"2025-09-24","model_type":"video","page_url":"https://fal.run/fal-ai/wan-25-preview/text-to-video","tagline":"Wan 2.5 text-to-video model.","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-27","last_updated":"2026-05-11"},{"id":"fal-ai/wan-alpha","name":"Wan Alpha","created_by":"fal","source":"official","family":"wan","description":"Generate videos with transparent backgrounds","status":"active","release_date":"2025-10-16","model_type":"video","page_url":"https://fal.run/fal-ai/wan-alpha","tagline":"Generate videos with transparent backgrounds","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/wan-ati","name":"Wan Ati","created_by":"fal","source":"official","family":"wan","description":"WAN-ATI is a controllable video generation model that uses trajectory instructions to guide object, local, and camera motion, enabling precise and flexible image-to-video 
creation.","status":"active","release_date":"2025-08-29","model_type":"video","page_url":"https://fal.run/fal-ai/wan-ati","tagline":"WAN-ATI is a controllable video generation model that uses trajectory instructions to guide object, local, and camera motion, enabling precise and flexible image-to-video creation.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/wan-effects","name":"Wan Effects","created_by":"fal","source":"official","family":"wan","description":"Wan Effects generates high-quality videos with popular effects from images","status":"active","release_date":"2025-03-13","model_type":"video","page_url":"https://fal.run/fal-ai/wan-effects","tagline":"Wan Effects generates high-quality videos with popular effects from images","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/wan-flf2v","name":"Wan-2.1 First-Last-Frame-to-Video","created_by":"fal","source":"official","family":"wan","description":"Wan-2.1 flf2v generates dynamic videos by intelligently bridging a given first frame to a desired end frame through smooth, coherent motion sequences.","status":"active","release_date":"2025-04-17","model_type":"video","page_url":"https://fal.run/fal-ai/wan-flf2v","tagline":"Wan-2.1 flf2v generates dynamic videos by intelligently bridging a given first frame to a desired end frame through smooth, coherent motion sequences.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/wan-fun-control","name":"Wan 2.2 Fun Control","created_by":"fal","source":"official","family":"wan","description":"Generate pose or depth controlled video using Alibaba-PAI's Wan 2.2 
Fun","status":"active","release_date":"2025-08-28","model_type":"other","page_url":"https://fal.run/fal-ai/wan-fun-control","tagline":"Generate pose or depth controlled video using Alibaba-PAI's Wan 2.2 Fun","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/wan-i2v-lora","name":"Wan-2.1 Image-to-Video with LoRAs","created_by":"fal","source":"official","family":"wan","description":"Add custom LoRAs to Wan-2.1 is a image-to-video model that generates high-quality videos with high visual quality and motion diversity from images","status":"active","release_date":"2025-03-08","model_type":"video","page_url":"https://fal.run/fal-ai/wan-i2v-lora","tagline":"Add custom LoRAs to Wan-2.1 is a image-to-video model that generates high-quality videos with high visual quality and motion diversity from images","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/wan-i2v","name":"Wan-2.1 Image-to-Video","created_by":"fal","source":"official","family":"wan","description":"Wan-2.1 is a image-to-video model that generates high-quality videos with high visual quality and motion diversity from images","status":"active","release_date":"2025-02-25","model_type":"video","page_url":"https://fal.run/fal-ai/wan-i2v","tagline":"Wan-2.1 is a image-to-video model that generates high-quality videos with high visual quality and motion diversity from images","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/wan-motion","name":"Wan Motion","created_by":"fal","source":"official","family":"wan","description":"Wan Motion is a streamlined character animation model that transfers motion from a driving video onto a reference character 
image.","status":"active","release_date":"2026-02-19","model_type":"other","page_url":"https://fal.run/fal-ai/wan-motion","tagline":"Wan Motion is a streamlined character animation model that transfers motion from a driving video onto a reference character image.","capabilities":{"vision":true},"last_seen_at":"2026-02-23","last_updated":"2026-05-11"},{"id":"fal-ai/wan-move","name":"Wan Move [480p]","created_by":"fal","source":"official","family":"wan","description":"Use Wan-Move to generate videos with controlled the motion using trajectories","status":"active","release_date":"2025-12-24","model_type":"video","page_url":"https://fal.run/fal-ai/wan-move","tagline":"Use Wan-Move to generate videos with controlled the motion using trajectories","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/wan-pro/image-to-video","name":"Wan-2.1 Pro Image-to-Video","created_by":"fal","source":"official","family":"wan","description":"Wan-2.1 Pro is a premium image-to-video model that generates high-quality 1080p videos at 30fps with up to 6 seconds duration, delivering exceptional visual quality and motion diversity from images","status":"active","release_date":"2025-03-11","model_type":"video","page_url":"https://fal.run/fal-ai/wan-pro/image-to-video","tagline":"Wan-2.1 Pro is a premium image-to-video model that generates high-quality 1080p videos at 30fps with up to 6 seconds duration, delivering exceptional visual quality and motion diversity from images","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/wan-pro/text-to-video","name":"Wan-2.1 Pro Text-to-Video","created_by":"fal","source":"official","family":"wan","description":"Wan-2.1 Pro is a premium text-to-video model that generates high-quality 1080p videos at 
30fps with up to 6 seconds duration, delivering exceptional visual quality and motion diversity from text promp","status":"active","release_date":"2025-03-11","model_type":"video","page_url":"https://fal.run/fal-ai/wan-pro/text-to-video","tagline":"Wan-2.1 Pro is a premium text-to-video model that generates high-quality 1080p videos at 30fps with up to 6 seconds duration, delivering exceptional visual quality and motion diversity from text promp","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/wan-t2v-lora","name":"Wan-2.1 Text-to-Video with LoRAs","created_by":"fal","source":"official","family":"wan","description":"Add custom LoRAs to Wan-2.1 is a text-to-video model that generates high-quality videos with high visual quality and motion diversity from images","status":"active","release_date":"2025-03-25","model_type":"video","page_url":"https://fal.run/fal-ai/wan-t2v-lora","tagline":"Add custom LoRAs to Wan-2.1 is a text-to-video model that generates high-quality videos with high visual quality and motion diversity from images","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/wan-t2v","name":"Wan-2.1 Text-to-Video","created_by":"fal","source":"official","family":"wan","description":"Wan-2.1 is a text-to-video model that generates high-quality videos with high visual quality and motion diversity from text prompts","status":"active","release_date":"2025-02-25","model_type":"video","page_url":"https://fal.run/fal-ai/wan-t2v","tagline":"Wan-2.1 is a text-to-video model that generates high-quality videos with high visual quality and motion diversity from text prompts","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/wan-trainer/flf2v-720p","name":"Wan-2.1 
LoRA Trainer","created_by":"fal","source":"official","family":"wan","description":"Train custom LoRAs for Wan-2.1 FLF2V 720P","status":"active","release_date":"2025-06-11","model_type":"other","page_url":"https://fal.run/fal-ai/wan-trainer/flf2v-720p","tagline":"Train custom LoRAs for Wan-2.1 FLF2V 720P","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/wan-trainer/i2v-720p","name":"Wan-2.1 LoRA Trainer","created_by":"fal","source":"official","family":"wan","description":"Train custom LoRAs for Wan-2.1 I2V 720P","status":"active","release_date":"2025-06-11","model_type":"other","page_url":"https://fal.run/fal-ai/wan-trainer/i2v-720p","tagline":"Train custom LoRAs for Wan-2.1 I2V 720P","last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/wan-trainer/t2v-14b","name":"Wan-2.1 LoRA Trainer","created_by":"fal","source":"official","family":"wan","description":"Train custom LoRAs for Wan-2.1 T2V 14B","status":"active","release_date":"2025-06-11","model_type":"other","parameters":14,"page_url":"https://fal.run/fal-ai/wan-trainer/t2v-14b","tagline":"Train custom LoRAs for Wan-2.1 T2V 14B","last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/wan-trainer/t2v","name":"Wan-2.1 LoRA Trainer","created_by":"fal","source":"official","family":"wan","description":"Train custom LoRAs for Wan-2.1 T2V 1.3B","status":"active","release_date":"2025-06-11","model_type":"other","page_url":"https://fal.run/fal-ai/wan-trainer/t2v","tagline":"Train custom LoRAs for Wan-2.1 T2V 1.3B","last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/wan-trainer","name":"Wan-2.1 LoRA Trainer","created_by":"fal","source":"official","family":"wan","description":"Train custom LoRAs for Wan-2.1 I2V 480P","status":"active","release_date":"2025-03-24","model_type":"other","page_url":"https://fal.run/fal-ai/wan-trainer","tagline":"Train custom LoRAs for Wan-2.1 I2V 
480P","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/wan/v2.1/1.3b/text-to-video","name":"Wan-2.1 1.3B Text-to-Video","created_by":"fal","source":"official","family":"wan","description":"Wan-2.1 1.3B is a text-to-video model that generates high-quality videos with high visual quality and motion diversity from text promptsat faster speeds.","status":"active","release_date":"2025-02-27","model_type":"video","page_url":"https://fal.run/fal-ai/wan/v2.1/1.3b/text-to-video","tagline":"Wan-2.1 1.3B is a text-to-video model that generates high-quality videos with high visual quality and motion diversity from text promptsat faster speeds.","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/wan/v2.2-14b/animate/move","name":"Wan-2.2 Animate Move","created_by":"fal","source":"official","family":"wan","description":"Wan-Animate is a video model that generates high-fidelity character videos by replicating the expressions and movements of characters from reference videos.","status":"active","release_date":"2025-09-21","model_type":"other","page_url":"https://fal.run/fal-ai/wan/v2.2-14b/animate/move","tagline":"Wan-Animate is a video model that generates high-fidelity character videos by replicating the expressions and movements of characters from reference videos.","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/wan/v2.2-14b/animate/replace","name":"Wan-2.2 Animate Replace","created_by":"fal","source":"official","family":"wan","description":"Wan-Animate Replace is a model that can integrate animated characters into reference videos, replacing the original character while preserving the scene’s lighting and color tone for seamless environm","status":"active","release_date":"2025-09-21","model_type":"other","page_url":"https://fal.run/fal-ai/wan/v2.2-14b/animate/replace","tagline":"Wan-Animate Replace is a model that can integrate animated 
characters into reference videos, replacing the original character while preserving the scene’s lighting and color tone for seamless environm","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/wan/v2.2-14b/speech-to-video","name":"Wan-2.2 Speech-to-Video 14B","created_by":"fal","source":"official","family":"wan","description":"Wan-S2V is a video model that generates high-quality videos from static images and audio, with realistic facial expressions, body movements, and professional camera work for film and television applic","status":"active","release_date":"2025-08-27","model_type":"other","page_url":"https://fal.run/fal-ai/wan/v2.2-14b/speech-to-video","tagline":"Wan-S2V is a video model that generates high-quality videos from static images and audio, with realistic facial expressions, body movements, and professional camera work for film and television applic","capabilities":{"vision":true},"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/wan/v2.2-5b/image-to-video","name":"Wan v2.2 5B","created_by":"fal","source":"official","family":"wan","description":"Wan 2.2's 5B model produces up to 5 seconds of video 720p at 24FPS with fluid motion and powerful prompt understanding","status":"active","release_date":"2025-07-30","model_type":"video","page_url":"https://fal.run/fal-ai/wan/v2.2-5b/image-to-video","tagline":"Wan 2.2's 5B model produces up to 5 seconds of video 720p at 24FPS with fluid motion and powerful prompt understanding","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/wan/v2.2-5b/text-to-image","name":"Wan","created_by":"fal","source":"official","family":"wan","description":"Wan 2.2's 5B model generates high-resolution, photorealistic images with powerful prompt understanding and fine-grained visual 
detail","status":"active","release_date":"2025-08-05","model_type":"image","page_url":"https://fal.run/fal-ai/wan/v2.2-5b/text-to-image","tagline":"Wan 2.2's 5B model generates high-resolution, photorealistic images with powerful prompt understanding and fine-grained visual detail","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/wan/v2.2-5b/text-to-video/distill","name":"Wan","created_by":"fal","source":"official","family":"wan","description":"Wan 2.2's 5B distill model produces up to 5 seconds of video 720p at 24FPS with fluid motion and powerful prompt understanding","status":"active","release_date":"2025-08-06","model_type":"video","page_url":"https://fal.run/fal-ai/wan/v2.2-5b/text-to-video/distill","tagline":"Wan 2.2's 5B distill model produces up to 5 seconds of video 720p at 24FPS with fluid motion and powerful prompt understanding","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/wan/v2.2-5b/text-to-video/fast-wan","name":"Wan","created_by":"fal","source":"official","family":"wan","description":"Wan 2.2's 5B FastVideo model produces up to 5 seconds of video 720p at 24FPS with fluid motion and powerful prompt understanding","status":"active","release_date":"2025-08-05","model_type":"video","page_url":"https://fal.run/fal-ai/wan/v2.2-5b/text-to-video/fast-wan","tagline":"Wan 2.2's 5B FastVideo model produces up to 5 seconds of video 720p at 24FPS with fluid motion and powerful prompt understanding","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/wan/v2.2-5b/text-to-video","name":"Wan v2.2 5B","created_by":"fal","source":"official","family":"wan","description":"Wan 2.2's 5B model produces up to 5 seconds of video 720p at 24FPS with fluid motion 
and powerful prompt understanding","status":"active","release_date":"2025-07-28","model_type":"video","page_url":"https://fal.run/fal-ai/wan/v2.2-5b/text-to-video","tagline":"Wan 2.2's 5B model produces up to 5 seconds of video 720p at 24FPS with fluid motion and powerful prompt understanding","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/wan/v2.2-a14b/image-to-image","name":"Wan","created_by":"fal","source":"official","family":"wan","description":"Wan 2.2's 14B model edit high-resolution, photorealistic images with powerful prompt understanding and fine-grained visual detail","status":"active","release_date":"2025-09-03","model_type":"image","page_url":"https://fal.run/fal-ai/wan/v2.2-a14b/image-to-image","tagline":"Wan 2.2's 14B model edit high-resolution, photorealistic images with powerful prompt understanding and fine-grained visual detail","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/wan/v2.2-a14b/image-to-video/lora","name":"Wan v2.2 A14B Image-to-Video A14B with LoRAs","created_by":"fal","source":"official","family":"wan","description":"Wan-2.2 image-to-video is a video model that generates high-quality videos with high visual quality and motion diversity from text prompts and images.","status":"active","release_date":"2025-08-07","model_type":"video","page_url":"https://fal.run/fal-ai/wan/v2.2-a14b/image-to-video/lora","tagline":"Wan-2.2 image-to-video is a video model that generates high-quality videos with high visual quality and motion diversity from text prompts and 
images.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/wan/v2.2-a14b/image-to-video/turbo","name":"Wan","created_by":"fal","source":"official","family":"wan","description":"Wan-2.2 Turbo image-to-video is a video model that generates high-quality videos with high visual quality and motion diversity from text prompts.","status":"active","release_date":"2025-07-31","model_type":"video","page_url":"https://fal.run/fal-ai/wan/v2.2-a14b/image-to-video/turbo","tagline":"Wan-2.2 Turbo image-to-video is a video model that generates high-quality videos with high visual quality and motion diversity from text prompts.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/wan/v2.2-a14b/image-to-video","name":"Wan v2.2 A14B","created_by":"fal","source":"official","family":"wan","description":"fal-ai/wan/v2.2-A14B/image-to-video","status":"active","release_date":"2025-07-28","model_type":"video","page_url":"https://fal.run/fal-ai/wan/v2.2-a14B/image-to-video","tagline":"fal-ai/wan/v2.2-A14B/image-to-video","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/wan/v2.2-a14b/text-to-image/lora","name":"Wan v2.2 A14B Text-to-Image A14B with LoRAs","created_by":"fal","source":"official","family":"wan","description":"Wan 2.2's 14B model with LoRA support generates high-fidelity images with enhanced prompt alignment, style adaptability.","status":"active","release_date":"2025-08-05","model_type":"image","page_url":"https://fal.run/fal-ai/wan/v2.2-a14b/text-to-image/lora","tagline":"Wan 2.2's 14B model with LoRA support generates high-fidelity images with enhanced prompt alignment, style 
adaptability.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/wan/v2.2-a14b/text-to-image","name":"Wan","created_by":"fal","source":"official","family":"wan","description":"Wan 2.2's 14B model generates high-resolution, photorealistic images with powerful prompt understanding and fine-grained visual detail","status":"active","release_date":"2025-08-05","model_type":"image","page_url":"https://fal.run/fal-ai/wan/v2.2-a14b/text-to-image","tagline":"Wan 2.2's 14B model generates high-resolution, photorealistic images with powerful prompt understanding and fine-grained visual detail","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/wan/v2.2-a14b/text-to-video/lora","name":"Wan-2.2 Text-to-Video A14B with LoRAs","created_by":"fal","source":"official","family":"wan","description":"Wan-2.2 text-to-video is a video model that generates high-quality videos with high visual quality and motion diversity from text prompts.","status":"active","release_date":"2025-08-07","model_type":"video","page_url":"https://fal.run/fal-ai/wan/v2.2-a14b/text-to-video/lora","tagline":"Wan-2.2 text-to-video is a video model that generates high-quality videos with high visual quality and motion diversity from text prompts.","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/wan/v2.2-a14b/text-to-video/turbo","name":"Wan","created_by":"fal","source":"official","family":"wan","description":"Wan-2.2 turbo text-to-video is a video model that generates high-quality videos with high visual quality and motion diversity from text 
prompts.","status":"active","release_date":"2025-07-31","model_type":"video","page_url":"https://fal.run/fal-ai/wan/v2.2-a14b/text-to-video/turbo","tagline":"Wan-2.2 turbo text-to-video is a video model that generates high-quality videos with high visual quality and motion diversity from text prompts.","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/wan/v2.2-a14b/text-to-video","name":"Wan-2.2 Text-to-Video A14B","created_by":"fal","source":"official","family":"wan","description":"Wan-2.2 text-to-video is a video model that generates high-quality videos with high visual quality and motion diversity from text prompts.","status":"active","release_date":"2025-07-28","model_type":"video","page_url":"https://fal.run/fal-ai/wan/v2.2-a14b/text-to-video","tagline":"Wan-2.2 text-to-video is a video model that generates high-quality videos with high visual quality and motion diversity from text prompts.","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/wan/v2.2-a14b/video-to-video","name":"Wan","created_by":"fal","source":"official","family":"wan","description":"Wan-2.2 video-to-video is a video model that generates high-quality videos with high visual quality and motion diversity from text prompts and source videos.","status":"active","release_date":"2025-08-02","model_type":"other","page_url":"https://fal.run/fal-ai/wan/v2.2-a14b/video-to-video","tagline":"Wan-2.2 video-to-video is a video model that generates high-quality videos with high visual quality and motion diversity from text prompts and source videos.","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/wan/v2.7/edit-video","name":"Wan","created_by":"fal","source":"official","family":"wan","description":"Wan 2.7 is the latest generation AI video model, delivering enhanced motion smoothness, superior scene 
fidelity, and greater visual coherence.","status":"active","release_date":"2026-03-28","model_type":"other","page_url":"https://fal.run/fal-ai/wan/v2.7/edit-video","tagline":"Wan 2.7 is the latest generation AI video model, delivering enhanced motion smoothness, superior scene fidelity, and greater visual coherence.","last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/wan/v2.7/edit","name":"Wan","created_by":"fal","source":"official","family":"wan","description":"Transform and edit existing images with text-guided instructions using the WAN 2.7 model for creative image manipulation.","status":"active","release_date":"2026-04-01","model_type":"image","page_url":"https://fal.run/fal-ai/wan/v2.7/edit","tagline":"Transform and edit existing images with text-guided instructions using the WAN 2.7 model for creative image manipulation.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/wan/v2.7/image-to-video","name":"Wan","created_by":"fal","source":"official","family":"wan","description":"Wan 2.7 is the latest generation AI video model, delivering enhanced motion smoothness, superior scene fidelity, and greater visual coherence.","status":"active","release_date":"2026-03-28","model_type":"video","page_url":"https://fal.run/fal-ai/wan/v2.7/image-to-video","tagline":"Wan 2.7 is the latest generation AI video model, delivering enhanced motion smoothness, superior scene fidelity, and greater visual coherence.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/wan/v2.7/pro/edit","name":"Wan","created_by":"fal","source":"official","family":"wan","description":"Edit and transform images using text instructions with the WAN 2.7 Pro model for precise, professional-grade image 
modifications.","status":"active","release_date":"2026-04-01","model_type":"image","page_url":"https://fal.run/fal-ai/wan/v2.7/pro/edit","tagline":"Edit and transform images using text instructions with the WAN 2.7 Pro model for precise, professional-grade image modifications.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/wan/v2.7/pro/text-to-image","name":"Wan","created_by":"fal","source":"official","family":"wan","description":"Generate premium-quality images from text prompts using the enhanced WAN 2.7 Pro model with superior detail and composition.","status":"active","release_date":"2026-04-01","model_type":"image","page_url":"https://fal.run/fal-ai/wan/v2.7/pro/text-to-image","tagline":"Generate premium-quality images from text prompts using the enhanced WAN 2.7 Pro model with superior detail and composition.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-20","last_updated":"2026-05-11"},{"id":"fal-ai/wan/v2.7/reference-to-video","name":"Wan 2.7 Reference to Video","created_by":"fal","source":"official","family":"wan","description":"Wan 2.7 is the latest generation AI video model, delivering enhanced motion smoothness, superior scene fidelity, and greater visual coherence.","status":"active","release_date":"2026-03-28","model_type":"video","page_url":"https://fal.run/fal-ai/wan/v2.7/reference-to-video","tagline":"Wan 2.7 is the latest generation AI video model, delivering enhanced motion smoothness, superior scene fidelity, and greater visual 
coherence.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/wan/v2.7/text-to-image","name":"Wan","created_by":"fal","source":"official","family":"wan","description":"Generate high-quality images from text prompts using the WAN 2.7 model with advanced prompt understanding and detailed output.","status":"active","release_date":"2026-04-01","model_type":"image","page_url":"https://fal.run/fal-ai/wan/v2.7/text-to-image","tagline":"Generate high-quality images from text prompts using the WAN 2.7 model with advanced prompt understanding and detailed output.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-20","last_updated":"2026-05-11"},{"id":"fal-ai/wan/v2.7/text-to-video","name":"Wan Text to Video","created_by":"fal","source":"official","family":"wan","description":"Wan 2.7 is the latest generation AI video model, delivering enhanced motion smoothness, superior scene fidelity, and greater visual coherence.","status":"active","release_date":"2026-03-28","model_type":"video","page_url":"https://fal.run/fal-ai/wan/v2.7/text-to-video","tagline":"Wan 2.7 is the latest generation AI video model, delivering enhanced motion smoothness, superior scene fidelity, and greater visual coherence.","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/wan-vace-1-3b","name":"Wan Vace 1 3b","created_by":"fal","source":"official","family":"wan","description":"Vace a video generation model that uses a source image, mask, and video to create prompted videos with controllable sources.","status":"active","release_date":"2025-06-04","model_type":"other","parameters":3,"page_url":"https://fal.run/fal-ai/wan-vace-1-3b","tagline":"Vace a video generation model that uses a source image, mask, 
and video to create prompted videos with controllable sources.","capabilities":{"vision":true},"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/wan-vace-14b/depth","name":"Wan VACE 14B","created_by":"fal","source":"official","family":"wan","description":"VACE is a video generation model that uses a source image, mask, and video to create prompted videos with controllable sources.","status":"active","release_date":"2025-06-18","model_type":"other","page_url":"https://fal.run/fal-ai/wan-vace-14b/depth","tagline":"VACE is a video generation model that uses a source image, mask, and video to create prompted videos with controllable sources.","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/wan-vace-14b/inpainting","name":"Wan VACE 14B","created_by":"fal","source":"official","family":"wan","description":"VACE is a video generation model that uses a source image, mask, and video to create prompted videos with controllable sources.","status":"active","release_date":"2025-06-18","model_type":"other","page_url":"https://fal.run/fal-ai/wan-vace-14b/inpainting","tagline":"VACE is a video generation model that uses a source image, mask, and video to create prompted videos with controllable sources.","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/wan-vace-14b/outpainting","name":"Wan VACE 14B","created_by":"fal","source":"official","family":"wan","description":"VACE is a video generation model that uses a source image, mask, and video to create prompted videos with controllable sources.","status":"active","release_date":"2025-06-18","model_type":"other","page_url":"https://fal.run/fal-ai/wan-vace-14b/outpainting","tagline":"VACE is a video generation model that uses a source image, mask, and video to create prompted videos with controllable 
sources.","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/wan-vace-14b/pose","name":"Wan VACE 14B","created_by":"fal","source":"official","family":"wan","description":"VACE is a video generation model that uses a source image, mask, and video to create prompted videos with controllable sources.","status":"active","release_date":"2025-06-18","model_type":"other","page_url":"https://fal.run/fal-ai/wan-vace-14b/pose","tagline":"VACE is a video generation model that uses a source image, mask, and video to create prompted videos with controllable sources.","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/wan-vace-14b/reframe","name":"Wan VACE 14B","created_by":"fal","source":"official","family":"wan","description":"VACE is a video generation model that uses a source image, mask, and video to create prompted videos with controllable sources.","status":"active","release_date":"2025-06-18","model_type":"other","page_url":"https://fal.run/fal-ai/wan-vace-14b/reframe","tagline":"VACE is a video generation model that uses a source image, mask, and video to create prompted videos with controllable sources.","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/wan-vace-14b","name":"Wan VACE 14B","created_by":"fal","source":"official","family":"wan","description":"VACE is a video generation model that uses a source image, mask, and video to create prompted videos with controllable sources.","status":"active","release_date":"2025-05-27","model_type":"other","parameters":14,"page_url":"https://fal.run/fal-ai/wan-vace-14b","tagline":"VACE is a video generation model that uses a source image, mask, and video to create prompted videos with controllable sources.","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/wan-vace-apps/long-reframe","name":"Wan 2.1 VACE Long 
Reframe","created_by":"fal","source":"official","family":"wan","description":"Reframe entire videos scene-by-scene using Wan VACE 2.1","status":"active","release_date":"2025-10-07","model_type":"other","page_url":"https://fal.run/fal-ai/wan-vace-apps/long-reframe","tagline":"Reframe entire videos scene-by-scene using Wan VACE 2.1","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/wan-vace-apps/video-edit","name":"Wan VACE Video Edit","created_by":"fal","source":"official","family":"wan","description":"Edit videos using plain language and Wan VACE","status":"active","release_date":"2025-09-22","model_type":"other","page_url":"https://fal.run/fal-ai/wan-vace-apps/video-edit","tagline":"Edit videos using plain language and Wan VACE","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/wan-vace","name":"Vace","created_by":"fal","source":"official","family":"wan","description":"Vace a video generation model that uses a source image, mask, and video to create prompted videos with controllable sources.","status":"active","release_date":"2025-04-11","model_type":"other","page_url":"https://fal.run/fal-ai/wan-vace","tagline":"Vace a video generation model that uses a source image, mask, and video to create prompted videos with controllable sources.","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/wan-vision-enhancer","name":"Wan Vision Enhancer","created_by":"fal","source":"official","family":"wan","description":"Wan Vision Enhancer for magnify/enhance video with high fidelity and creativity.","status":"active","release_date":"2025-12-10","model_type":"other","page_url":"https://fal.run/fal-ai/wan-vision-enhancer","tagline":"Wan Vision Enhancer for magnify/enhance video with high fidelity and creativity.","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/wizper","name":"Wizper (Whisper v3 -- fal.ai 
edition)","created_by":"fal","source":"official","description":"[Experimental] Whisper v3 Large -- but optimized by our inference wizards.","status":"active","release_date":"2024-04-08","model_type":"transcription","page_url":"https://fal.run/fal-ai/wizper","tagline":"[Experimental] Whisper v3 Large -- but optimized by our inference wizards.","modalities":{"input":["audio"],"output":["text"]},"endpoints":["audio_transcriptions"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/workflow-utilities/audio-compressor","name":"Workflow Utilities Audio Compressor","created_by":"fal","source":"official","description":"FFMPEG Utility for Audio Compression","status":"active","release_date":"2026-02-05","model_type":"other","page_url":"https://fal.run/fal-ai/workflow-utilities/audio-compressor","tagline":"FFMPEG Utility for Audio Compression","last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/workflow-utilities/auto-subtitle","name":"Workflow Utilities Auto Subtitle","created_by":"fal","source":"official","description":"Add automatic subtitles to videos","status":"active","release_date":"2025-11-04","model_type":"other","page_url":"https://fal.run/fal-ai/workflow-utilities/auto-subtitle","tagline":"Add automatic subtitles to videos","last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/workflow-utilities/blend-video","name":"Workflow Utilities Blend Video","created_by":"fal","source":"official","description":"FFMPEG Utility for Blending Videos","status":"active","release_date":"2026-02-05","model_type":"other","page_url":"https://fal.run/fal-ai/workflow-utilities/blend-video","tagline":"FFMPEG Utility for Blending Videos","last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/workflow-utilities/extract-nth-frame","name":"Workflow Utilities Extract Nth Frame","created_by":"fal","source":"official","description":"FFMPEG Untility for Extracting nth 
Frame","status":"active","release_date":"2026-02-05","model_type":"image","page_url":"https://fal.run/fal-ai/workflow-utilities/extract-nth-frame","tagline":"FFMPEG Untility for Extracting nth Frame","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/workflow-utilities/impulse-response","name":"Workflow Utilities Impulse Response","created_by":"fal","source":"official","description":"FFMPEG Utility for Impulse Response","status":"active","release_date":"2026-02-05","model_type":"other","page_url":"https://fal.run/fal-ai/workflow-utilities/impulse-response","tagline":"FFMPEG Utility for Impulse Response","last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/workflow-utilities/interleave-video","name":"Workflow Utilities Interleave Video","created_by":"fal","source":"official","description":"ffmpeg utility to interleave videos","status":"active","release_date":"2026-01-27","model_type":"other","page_url":"https://fal.run/fal-ai/workflow-utilities/interleave-video","tagline":"ffmpeg utility to interleave videos","last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/workflow-utilities/pick-image-by-index","name":"Workflow Utilities Pick Image By Index","created_by":"fal","source":"official","description":"Choose the Nth image from an image URL list for workflows.","status":"active","release_date":"2026-04-29","model_type":"other","page_url":"https://fal.run/fal-ai/workflow-utilities/pick-image-by-index","tagline":"Choose the Nth image from an image URL list for workflows.","capabilities":{"vision":true},"last_seen_at":"2026-04-30","last_updated":"2026-06-03"},{"id":"fal-ai/workflow-utilities/reverse-video","name":"Workflow Utilities Reverse Video","created_by":"fal","source":"official","description":"FFMPEG Utility to Reverse 
Videos","status":"active","release_date":"2026-02-19","model_type":"other","page_url":"https://fal.run/fal-ai/workflow-utilities/reverse-video","tagline":"FFMPEG Utility to Reverse Videos","last_seen_at":"2026-02-19","last_updated":"2026-06-03"},{"id":"fal-ai/workflow-utilities/scale-video","name":"Workflow Utilities Scale Video","created_by":"fal","source":"official","description":"FFMPEG Utilities to Scale Videos","status":"active","release_date":"2026-02-16","model_type":"other","page_url":"https://fal.run/fal-ai/workflow-utilities/scale-video","tagline":"FFMPEG Utilities to Scale Videos","last_seen_at":"2026-02-17","last_updated":"2026-06-03"},{"id":"fal-ai/workflow-utilities/trim-video","name":"Workflow Utilities Trim Video","created_by":"fal","source":"official","description":"FFMPEG Utility for Trim Video","status":"active","release_date":"2026-02-11","model_type":"other","page_url":"https://fal.run/fal-ai/workflow-utilities/trim-video","tagline":"FFMPEG Utility for Trim Video","last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/x-ailab/nsfw","name":"NSFW Checker","created_by":"fal","source":"official","description":"Predict whether an image is NSFW or SFW.","status":"active","release_date":"2025-07-28","model_type":"other","page_url":"https://fal.run/fal-ai/x-ailab/nsfw","tagline":"Predict whether an image is NSFW or SFW.","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/yue","name":"YuE: Lyrics to Song","created_by":"fal","source":"official","description":"YuE is a groundbreaking series of open-source foundation models designed for music generation, specifically for transforming lyrics into full songs.","status":"active","release_date":"2025-01-28","model_type":"other","page_url":"https://fal.run/fal-ai/yue","tagline":"YuE is a groundbreaking series of open-source foundation models designed for music generation, specifically for transforming lyrics into full 
songs.","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/z-image/base/lora","name":"Z Image Base Lora","created_by":"fal","source":"official","description":"LoRA endpoint for Z-Image, the foundation model of the Z- Image family.","status":"active","release_date":"2026-01-27","model_type":"image","page_url":"https://fal.run/fal-ai/z-image/base/lora","tagline":"LoRA endpoint for Z-Image, the foundation model of the Z- Image family.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-26","last_updated":"2026-06-03"},{"id":"fal-ai/z-image-base-trainer","name":"Z-Image Trainer","created_by":"fal","source":"official","description":"Fast LoRA trainer for Z-Image, a super fast text-to-image model of 6B parameters developed by Tongyi-MAI.","status":"active","release_date":"2026-01-27","model_type":"other","page_url":"https://fal.run/fal-ai/z-image-base-trainer","tagline":"Fast LoRA trainer for Z-Image, a super fast text-to-image model of 6B parameters developed by Tongyi-MAI.","capabilities":{"vision":true},"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/z-image/base","name":"Z Image Base","created_by":"fal","source":"official","description":"Z-Image is the foundation model of the Z- Image family, engineered for good quality, robust generative diversity, broad stylistic coverage, and precise prompt adherence.","status":"active","release_date":"2026-01-27","model_type":"image","page_url":"https://fal.run/fal-ai/z-image/base","tagline":"Z-Image is the foundation model of the Z- Image family, engineered for good quality, robust generative diversity, broad stylistic coverage, and precise prompt adherence.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/z-image-trainer","name":"Z Image 
Trainer","created_by":"fal","source":"official","description":"Train LoRAs on Z-Image Turbo, a super fast text-to-image model of 6B parameters developed by Tongyi-MAI.","status":"active","release_date":"2025-12-03","model_type":"other","page_url":"https://fal.run/fal-ai/z-image-trainer","tagline":"Train LoRAs on Z-Image Turbo, a super fast text-to-image model of 6B parameters developed by Tongyi-MAI.","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/z-image/turbo/controlnet/lora","name":"Z Image Turbo Controlnet Lora","created_by":"fal","source":"official","description":"Generate images from text and edge, depth or pose images using custom LoRA and Z-Image Turbo, Tongyi-MAI's super-fast 6B model.","status":"active","release_date":"2025-12-07","model_type":"image","page_url":"https://fal.run/fal-ai/z-image/turbo/controlnet/lora","tagline":"Generate images from text and edge, depth or pose images using custom LoRA and Z-Image Turbo, Tongyi-MAI's super-fast 6B model.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-26","last_updated":"2026-06-03"},{"id":"fal-ai/z-image/turbo/controlnet","name":"Z Image Turbo Controlnet","created_by":"fal","source":"official","description":"Generate images from text and edge, depth or pose images using Z-Image Turbo, Tongyi-MAI's super-fast 6B model.","status":"active","release_date":"2025-12-07","model_type":"image","page_url":"https://fal.run/fal-ai/z-image/turbo/controlnet","tagline":"Generate images from text and edge, depth or pose images using Z-Image Turbo, Tongyi-MAI's super-fast 6B model.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/z-image/turbo/image-to-image/lora","name":"Z Image Turbo Image To Image 
Lora","created_by":"fal","source":"official","description":"Generate images from text and images using custom LoRA and Z-Image Turbo, Tongyi-MAI's super-fast 6B model.","status":"active","release_date":"2025-12-07","model_type":"image","page_url":"https://fal.run/fal-ai/z-image/turbo/image-to-image/lora","tagline":"Generate images from text and images using custom LoRA and Z-Image Turbo, Tongyi-MAI's super-fast 6B model.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/z-image/turbo/image-to-image","name":"Z Image Turbo Image To Image","created_by":"fal","source":"official","description":"Generate images from text and images using Z-Image Turbo, Tongyi-MAI's super-fast 6B model.","status":"active","release_date":"2025-12-07","model_type":"image","page_url":"https://fal.run/fal-ai/z-image/turbo/image-to-image","tagline":"Generate images from text and images using Z-Image Turbo, Tongyi-MAI's super-fast 6B model.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/z-image/turbo/inpaint/lora","name":"Z Image Turbo Inpaint Lora","created_by":"fal","source":"official","description":"Generate images from text, an image, a mask and custom LoRA using Z-Image Turbo, Tongyi-MAI's super-fast 6B model.","status":"active","release_date":"2025-12-18","model_type":"image","page_url":"https://fal.run/fal-ai/z-image/turbo/inpaint/lora","tagline":"Generate images from text, an image, a mask and custom LoRA using Z-Image Turbo, Tongyi-MAI's super-fast 6B model.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-26","last_updated":"2026-06-03"},{"id":"fal-ai/z-image/turbo/inpaint","name":"Z Image Turbo 
Inpaint","created_by":"fal","source":"official","description":"Generate images from text, an image and a mask using Z-Image Turbo, Tongyi-MAI's super-fast 6B model.","status":"active","release_date":"2025-12-18","model_type":"image","page_url":"https://fal.run/fal-ai/z-image/turbo/inpaint","tagline":"Generate images from text, an image and a mask using Z-Image Turbo, Tongyi-MAI's super-fast 6B model.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/z-image/turbo/lora","name":"Z Image Turbo Lora","created_by":"fal","source":"official","description":"Text-to-Image endpoint with LoRA support for Z-Image Turbo, a super fast text-to-image model of 6B parameters developed by Tongyi-MAI.","status":"active","release_date":"2025-12-01","model_type":"image","page_url":"https://fal.run/fal-ai/z-image/turbo/lora","tagline":"Text-to-Image endpoint with LoRA support for Z-Image Turbo, a super fast text-to-image model of 6B parameters developed by Tongyi-MAI.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-28","last_updated":"2026-06-03"},{"id":"fal-ai/z-image/turbo/tiling/lora","name":"Z-Image Turbo Seamless Tiling Lora","created_by":"fal","source":"official","description":"Generate seamlessly tiling photorealistic images from text using Z-Image Turbo and custom LoRA","status":"active","release_date":"2026-03-17","model_type":"image","page_url":"https://fal.run/fal-ai/z-image/turbo/tiling/lora","tagline":"Generate seamlessly tiling photorealistic images from text using Z-Image Turbo and custom LoRA","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-26","last_updated":"2026-06-03"},{"id":"fal-ai/z-image/turbo/tiling","name":"Z-Image Turbo Seamless 
Tiling","created_by":"fal","source":"official","description":"Generate seamlessly tiling photorealistic images from text using Z-Image Turbo","status":"active","release_date":"2026-03-17","model_type":"image","page_url":"https://fal.run/fal-ai/z-image/turbo/tiling","tagline":"Generate seamlessly tiling photorealistic images from text using Z-Image Turbo","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/z-image-turbo-trainer-v2","name":"Z Image Turbo Trainer V2","created_by":"fal","source":"official","description":"Fast LoRA trainer for Z-Image-Turbo, a super fast text-to-image model of 6B parameters developed by Tongyi-MAI.","status":"active","release_date":"2026-01-24","model_type":"other","page_url":"https://fal.run/fal-ai/z-image-turbo-trainer-v2","tagline":"Fast LoRA trainer for Z-Image-Turbo, a super fast text-to-image model of 6B parameters developed by Tongyi-MAI.","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/z-image/turbo","name":"Z Image Turbo","created_by":"fal","source":"official","description":"Z-Image Turbo is a super fast text-to-image model of 6B parameters developed by Tongyi-MAI.","status":"active","release_date":"2025-11-26","model_type":"image","page_url":"https://fal.run/fal-ai/z-image/turbo","tagline":"Z-Image Turbo is a super fast text-to-image model of 6B parameters developed by Tongyi-MAI.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-28","last_updated":"2026-06-03"},{"id":"fal-ai/zonos","name":"Zonos-Audio-Clone","created_by":"fal","source":"official","description":"Clone voice of any person and speak anything in their voice using zonos' voice cloning.","status":"active","release_date":"2025-02-14","model_type":"other","page_url":"https://fal.run/fal-ai/zonos","tagline":"Clone 
voice of any person and speak anything in their voice using zonos' voice cloning.","last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/zonos2","name":"Zonos2 Text to Speech","created_by":"fal","source":"official","description":"Zonos2 is a text-to-speech model that clones a voice from a short sample and speaks naturally across many languages.","status":"active","release_date":"2026-06-16","model_type":"tts","page_url":"https://fal.run/fal-ai/zonos2","tagline":"Zonos2 is a text-to-speech model that clones a voice from a short sample and speaks naturally across many languages.","modalities":{"input":["text"],"output":["audio"]},"endpoints":["audio_speech"],"last_seen_at":"2026-06-16","last_updated":"2026-06-18"},{"id":"ideogram/v4/image-to-image/lora","name":"Ideogram V4.0q Image to Image LoRA","created_by":"ideogram","source":"official","description":"Ideogram V4.0q Image-to-Image LoRA applies a custom-trained LoRA on top of an input image, steering edits toward a specific style, subject, or brand identity while keeping the source composition intac","status":"active","release_date":"2026-06-10","model_type":"image","page_url":"https://fal.run/ideogram/v4/image-to-image/lora","tagline":"Ideogram V4.0q Image-to-Image LoRA applies a custom-trained LoRA on top of an input image, steering edits toward a specific style, subject, or brand identity while keeping the source composition intac","capabilities":{"streaming":true,"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-19","last_updated":"2026-06-20"},{"id":"ideogram/v4/image-to-image","name":"Ideogram V4.0q Image to Image","created_by":"ideogram","source":"official","description":"Ideogram V4.0q Image-to-Image transforms an input image with a text prompt, restyling and reworking the composition while preserving its core structure for prompt-faithful, high-fidelity 
edits.","status":"active","release_date":"2026-06-10","model_type":"image","page_url":"https://fal.run/ideogram/v4/image-to-image","tagline":"Ideogram V4.0q Image-to-Image transforms an input image with a text prompt, restyling and reworking the composition while preserving its core structure for prompt-faithful, high-fidelity edits.","capabilities":{"streaming":true,"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-19","last_updated":"2026-06-20"},{"id":"ideogram/v4/lora","name":"Ideogram V4.0q Text to Image (LoRA)","created_by":"ideogram","source":"official","description":"Generate high-quality images, posters, and logos with Ideogram's latest V4.0q using LoRA — producing crisp visuals with accurate text rendering, fine detail, and full creative control for polished, re","status":"active","release_date":"2026-06-08","model_type":"image","page_url":"https://fal.run/ideogram/v4/lora","tagline":"Generate high-quality images, posters, and logos with Ideogram's latest V4.0q using LoRA — producing crisp visuals with accurate text rendering, fine detail, and full creative control for polished, re","capabilities":{"vision":true,"streaming":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-19","last_updated":"2026-06-20"},{"id":"ideogram/v4/tiling/lora","name":"Ideogram V4.0q Tiling LoRA","created_by":"ideogram","source":"official","description":"Ideogram V4.0q Tiling LoRA produces seamless repeatable patterns guided by a custom-trained LoRA, locking a specific aesthetic or motif into tileable textures for cohesive, large-scale surface design.","status":"active","release_date":"2026-06-10","model_type":"image","page_url":"https://fal.run/ideogram/v4/tiling/lora","tagline":"Ideogram V4.0q Tiling LoRA produces seamless repeatable patterns guided by a custom-trained LoRA, locking a specific aesthetic or motif into tileable textures for cohesive, 
large-scale surface design.","capabilities":{"streaming":true,"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-19","last_updated":"2026-06-20"},{"id":"ideogram/v4/tiling","name":"Ideogram V4.0q Tiling","created_by":"ideogram","source":"official","description":"Ideogram V4.0q Tiling generates seamless, edge-matching textures and patterns that repeat infinitely in any direction, ideal for backgrounds, surfaces, and wallpapers.","status":"active","release_date":"2026-06-10","model_type":"image","page_url":"https://fal.run/ideogram/v4/tiling","tagline":"Ideogram V4.0q Tiling generates seamless, edge-matching textures and patterns that repeat infinitely in any direction, ideal for backgrounds, surfaces, and wallpapers.","capabilities":{"streaming":true,"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-19","last_updated":"2026-06-20"},{"id":"ideogram/v4/trainer","name":"Ideogram V4.0q LoRA Trainer","created_by":"ideogram","source":"official","description":"Train custom LoRAs for personalization, styles or other use cases on top of Ideogram V4.","status":"active","release_date":"2026-06-09","model_type":"other","page_url":"https://fal.run/ideogram/v4/trainer","tagline":"Train custom LoRAs for personalization, styles or other use cases on top of Ideogram V4.","last_seen_at":"2026-06-10","last_updated":"2026-06-10"},{"id":"ideogram/v4","name":"Ideogram V4.0 Text to Image","created_by":"ideogram","source":"official","description":"Generate high-quality images, posters, and logos with Ideogram's latest V4.0q — producing crisp visuals with accurate text rendering, fine detail, and full creative control for polished, ready-to-use ","status":"active","release_date":"2026-06-02","model_type":"image","page_url":"https://fal.run/ideogram/v4","tagline":"Generate high-quality images, posters, and logos with Ideogram's latest V4.0q — producing 
crisp visuals with accurate text rendering, fine detail, and full creative control for polished, ready-to-use ","capabilities":{"vision":true,"streaming":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"imagineart/imagineart-1.5-preview/text-to-image","name":"Imagineart 1.5 Preview","created_by":"imagineart","source":"official","description":"ImagineArt 1.5 text-to-image model generates high-fidelity professional-grade visuals with lifelike realism, strong aesthetics, and text that actually reads correctly.","status":"active","release_date":"2025-11-20","model_type":"image","page_url":"https://fal.run/imagineart/imagineart-1.5-preview/text-to-image","tagline":"ImagineArt 1.5 text-to-image model generates high-fidelity professional-grade visuals with lifelike realism, strong aesthetics, and text that actually reads correctly.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"imagineart/imagineart-1.5-pro-preview/text-to-image","name":"ImagineArt 1.5 Pro Preview","created_by":"imagineart","source":"official","description":"ImagineArt 1.5 Pro is an advanced text-to-image model that creates ultra-high-fidelity 4K visuals with lifelike realism, refined aesthetics, and powerful creative output suited for professional use.","status":"active","release_date":"2026-01-15","model_type":"image","page_url":"https://fal.run/imagineart/imagineart-1.5-pro-preview/text-to-image","tagline":"ImagineArt 1.5 Pro is an advanced text-to-image model that creates ultra-high-fidelity 4K visuals with lifelike realism, refined aesthetics, and powerful creative output suited for professional 
use.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"imagineart/imagineart-2.0-edit-preview/image-to-image","name":"Imagineart 2.0 Edit Preview","created_by":"imagineart","source":"official","description":"ImagineArt 2.0 Edit delivers precise prompt-guided image editing at 2K resolution, preserving fine detail and realism while accurately applying targeted changes across one or more reference images.","status":"active","release_date":"2026-05-19","model_type":"image","page_url":"https://fal.run/imagineart/imagineart-2.0-edit-preview/image-to-image","tagline":"ImagineArt 2.0 Edit delivers precise prompt-guided image editing at 2K resolution, preserving fine detail and realism while accurately applying targeted changes across one or more reference images.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-05-19","last_updated":"2026-06-03"},{"id":"imagineart/imagineart-2.0-preview/text-to-image","name":"Imagineart 2.0 Preview","created_by":"imagineart","source":"official","description":"ImagineArt 2.0 is ImagineArt's latest state-of-the-art visual reasoning text-to-image model, generating high-fidelity, professional-grade visuals with lifelike realism, cinematic effects, and strong a","status":"active","release_date":"2026-04-13","model_type":"image","page_url":"https://fal.run/imagineart/imagineart-2.0-preview/text-to-image","tagline":"ImagineArt 2.0 is ImagineArt's latest state-of-the-art visual reasoning text-to-image model, generating high-fidelity, professional-grade visuals with lifelike realism, cinematic effects, and strong a","capabilities":{"vision":true,"reasoning":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"krea/v2/large/text-to-image","name":"Krea 2 
Large","created_by":"krea","source":"official","description":"Generate high-fidelity images from text with Krea 2 Large, supporting aspect ratio, creativity, seed controls, and optional style references.","status":"active","release_date":"2026-05-27","model_type":"image","page_url":"https://fal.run/krea/v2/large/text-to-image","tagline":"Generate high-fidelity images from text with Krea 2 Large, supporting aspect ratio, creativity, seed controls, and optional style references.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-11","last_updated":"2026-06-18"},{"id":"krea/v2/medium/text-to-image","name":"Krea 2 Medium","created_by":"krea","source":"official","description":"Generate high-quality images from text with Krea 2 Medium, supporting aspect ratio, creativity controls, seeds, and optional style references.","status":"active","release_date":"2026-05-27","model_type":"image","page_url":"https://fal.run/krea/v2/medium/text-to-image","tagline":"Generate high-quality images from text with Krea 2 Medium, supporting aspect ratio, creativity controls, seeds, and optional style references.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-05-29","last_updated":"2026-06-03"},{"id":"krea/v2/medium/turbo/text-to-image","name":"Krea 2 Medium Text to Image Turbo","created_by":"krea","source":"official","description":"Generate high-fidelity images extremely fast from text with Krea 2 Medium Turbo, supporting aspect ratio, creativity, seed controls, and optional style references.","status":"active","release_date":"2026-06-03","model_type":"image","page_url":"https://fal.run/krea/v2/medium/turbo/text-to-image","tagline":"Generate high-fidelity images extremely fast from text with Krea 2 Medium Turbo, supporting aspect ratio, creativity, seed controls, and optional style 
references.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-17","last_updated":"2026-06-18"},{"id":"luma/agent/ray/v3.2/image-to-video","name":"Luma Ray 3.2 Image to Video","created_by":"luma","source":"official","description":"Luma Ray 3.2 animates a source image into cinematic motion guided by a text prompt, preserving the starting frame's look while controlling resolution, duration, and seamless looping.","status":"active","release_date":"2026-06-09","model_type":"video","page_url":"https://fal.run/luma/agent/ray/v3.2/image-to-video","tagline":"Luma Ray 3.2 animates a source image into cinematic motion guided by a text prompt, preserving the starting frame's look while controlling resolution, duration, and seamless looping.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-15","last_updated":"2026-06-18"},{"id":"luma/agent/ray/v3.2/reframe","name":"Luma Ray 3.2 Reframe","created_by":"luma","source":"official","description":"Luma Ray 3.2 reframes an existing video into a new aspect ratio guided by a text prompt, preserving the original footage frame-for-frame while controlling resolution and outpainting the surrounding ca","status":"active","release_date":"2026-06-11","model_type":"other","page_url":"https://fal.run/luma/agent/ray/v3.2/reframe","tagline":"Luma Ray 3.2 reframes an existing video into a new aspect ratio guided by a text prompt, preserving the original footage frame-for-frame while controlling resolution and outpainting the surrounding ca","last_seen_at":"2026-06-15","last_updated":"2026-06-18"},{"id":"luma/agent/ray/v3.2/text-to-video","name":"Luma Ray 3.2 Text to Video","created_by":"luma","source":"official","description":"Luma Ray 3.2 generates cinematic video from a text prompt, with control over resolution, duration, and seamless looping, plus reference images to lock in 
subject and style.","status":"active","release_date":"2026-06-09","model_type":"video","page_url":"https://fal.run/luma/agent/ray/v3.2/text-to-video","tagline":"Luma Ray 3.2 generates cinematic video from a text prompt, with control over resolution, duration, and seamless looping, plus reference images to lock in subject and style.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-15","last_updated":"2026-06-18"},{"id":"luma/agent/ray/v3.2/video-to-video","name":"Luma Ray 3.2 Video to Video","created_by":"luma","source":"official","description":"Luma Ray 3.2 re-renders an existing video into new cinematic motion guided by a text prompt, preserving the source's look and movement while controlling resolution, duration, and HDR.","status":"active","release_date":"2026-06-11","model_type":"other","page_url":"https://fal.run/luma/agent/ray/v3.2/video-to-video","tagline":"Luma Ray 3.2 re-renders an existing video into new cinematic motion guided by a text prompt, preserving the source's look and movement while controlling resolution, duration, and HDR.","last_seen_at":"2026-06-15","last_updated":"2026-06-18"},{"id":"luma/agent/uni-1/v1/edit","name":"Luma Uni-1 Edit","created_by":"luma","source":"official","description":"Luma Uni-1 Edit reworks a source image from a text instruction, preserving the original composition while applying style changes and following optional reference images to steer the result.","status":"active","release_date":"2026-06-09","model_type":"image","page_url":"https://fal.run/luma/agent/uni-1/v1/edit","tagline":"Luma Uni-1 Edit reworks a source image from a text instruction, preserving the original composition while applying style changes and following optional reference images to steer the 
result.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-15","last_updated":"2026-06-18"},{"id":"luma/agent/uni-1/v1/max/edit","name":"Luma Uni-1 Edit Max","created_by":"luma","source":"official","description":"Luma Uni-1 Max Edit applies text-guided edits to a source image at maximum fidelity, holding the original structure while honoring reference images for precise, high-detail revisions.","status":"active","release_date":"2026-06-09","model_type":"image","page_url":"https://fal.run/luma/agent/uni-1/v1/max/edit","tagline":"Luma Uni-1 Max Edit applies text-guided edits to a source image at maximum fidelity, holding the original structure while honoring reference images for precise, high-detail revisions.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-15","last_updated":"2026-06-18"},{"id":"luma/agent/uni-1/v1/max","name":"Luma Uni-1 Text to Image Max","created_by":"luma","source":"official","description":"Luma Uni-1 Max generates a single image at the model's highest fidelity, delivering richer detail and stronger prompt adherence than the base tier for hero-quality stills.","status":"active","release_date":"2026-06-09","model_type":"image","page_url":"https://fal.run/luma/agent/uni-1/v1/max","tagline":"Luma Uni-1 Max generates a single image at the model's highest fidelity, delivering richer detail and stronger prompt adherence than the base tier for hero-quality stills.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-15","last_updated":"2026-06-18"},{"id":"luma/agent/uni-1/v1/text-to-image","name":"Luma Uni-1 Text to Image","created_by":"luma","source":"official","description":"Luma Uni-1 turns a text prompt into a single high-fidelity image, with control over aspect ratio and visual style, plus optional 
web-sourced and reference-image guidance for sharper grounding.","status":"active","release_date":"2026-06-09","model_type":"image","page_url":"https://fal.run/luma/agent/uni-1/v1/text-to-image","tagline":"Luma Uni-1 turns a text prompt into a single high-fidelity image, with control over aspect ratio and visual style, plus optional web-sourced and reference-image guidance for sharper grounding.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-15","last_updated":"2026-06-18"},{"id":"microsoft/mai-image-2.5/edit","name":"Mai Image 2.5","created_by":"microsoft","source":"official","description":"MAI-Image-2.5 is Microsoft's photorealistic image generation and editing model that turns text prompts or uploaded images into high-quality, design-ready visuals with fine-grained, pixel-level control","status":"active","release_date":"2026-06-03","model_type":"image","page_url":"https://fal.run/microsoft/mai-image-2.5/edit","tagline":"MAI-Image-2.5 is Microsoft's photorealistic image generation and editing model that turns text prompts or uploaded images into high-quality, design-ready visuals with fine-grained, pixel-level control","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-04","last_updated":"2026-06-10"},{"id":"microsoft/mai-image-2.5","name":"Mai Image 2.5 Text to Image","created_by":"microsoft","source":"official","description":"MAI-Image-2.5 is Microsoft's photorealistic image generation and editing model that turns text prompts or uploaded images into high-quality, design-ready visuals with fine-grained, pixel-level control","status":"active","release_date":"2026-06-02","model_type":"image","page_url":"https://fal.run/microsoft/mai-image-2.5","tagline":"MAI-Image-2.5 is Microsoft's photorealistic image generation and editing model that turns text prompts or uploaded images into high-quality, 
design-ready visuals with fine-grained, pixel-level control","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"mirelo-ai/sfx-v1/video-to-audio","name":"Mirelo SFX","created_by":"mirelo-ai","source":"official","description":"Generate synced sounds for any video, and return the new sound track (like MMAudio)","status":"active","release_date":"2025-08-15","model_type":"other","page_url":"https://fal.run/mirelo-ai/sfx-v1/video-to-audio","tagline":"Generate synced sounds for any video, and return the new sound track (like MMAudio)","last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"mirelo-ai/sfx-v1/video-to-video","name":"Mirelo SFX","created_by":"mirelo-ai","source":"official","description":"Generate synced sounds for any video, and return it with its new sound track (like MMAudio)\n","status":"active","release_date":"2025-08-14","model_type":"other","page_url":"https://fal.run/mirelo-ai/sfx-v1/video-to-video","tagline":"Generate synced sounds for any video, and return it with its new sound track (like MMAudio)\n","last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"mirelo-ai/sfx-v1.5/video-to-audio","name":"Mirelo SFX V1.5","created_by":"mirelo-ai","source":"official","description":"Generate synced sounds for any video, and return the new sound track (like MMAudio)","status":"active","release_date":"2025-10-15","model_type":"other","page_url":"https://fal.run/mirelo-ai/sfx-v1.5/video-to-audio","tagline":"Generate synced sounds for any video, and return the new sound track (like MMAudio)","last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"mirelo-ai/sfx-v1.5/video-to-video","name":"Mirelo SFX V1.5","created_by":"mirelo-ai","source":"official","description":"Generate synced sounds for any video, and return it with its new sound track (like 
MMAudio)","status":"active","release_date":"2025-10-15","model_type":"other","page_url":"https://fal.run/mirelo-ai/sfx-v1.5/video-to-video","tagline":"Generate synced sounds for any video, and return it with its new sound track (like MMAudio)","last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"mirelo-ai/sfx1.6/extend-audio","name":"Mirelo SFX1.6","created_by":"mirelo-ai","source":"official","description":"Extend any sound effect with seamless, natural tails.","status":"active","release_date":"2026-05-18","model_type":"other","page_url":"https://fal.run/mirelo-ai/sfx1.6/extend-audio","tagline":"Extend any sound effect with seamless, natural tails.","last_seen_at":"2026-05-19","last_updated":"2026-06-03"},{"id":"mirelo-ai/sfx1.6/inpaint-audio","name":"Mirelo SFX1.6","created_by":"mirelo-ai","source":"official","description":"Erase and replace any moment in your audio with AI-driven precision.","status":"active","release_date":"2026-05-18","model_type":"other","page_url":"https://fal.run/mirelo-ai/sfx1.6/inpaint-audio","tagline":"Erase and replace any moment in your audio with AI-driven precision.","last_seen_at":"2026-05-19","last_updated":"2026-06-03"},{"id":"mirelo-ai/sfx1.6/text-to-audio","name":"Mirelo SFX1.6","created_by":"mirelo-ai","source":"official","description":"Generate ambient sounds for any text prompt.","status":"active","release_date":"2026-05-15","model_type":"other","page_url":"https://fal.run/mirelo-ai/sfx1.6/text-to-audio","tagline":"Generate ambient sounds for any text prompt.","last_seen_at":"2026-05-19","last_updated":"2026-06-03"},{"id":"mirelo-ai/sfx1.6/video-to-video","name":"Mirelo SFX1.6","created_by":"mirelo-ai","source":"official","description":"Generate synced sounds for any video, and return it with its new sound track (like MMAudio).","status":"active","release_date":"2026-05-18","model_type":"other","page_url":"https://fal.run/mirelo-ai/sfx1.6/video-to-video","tagline":"Generate synced sounds for any video, and return it 
with its new sound track (like MMAudio).","last_seen_at":"2026-05-19","last_updated":"2026-06-03"},{"id":"moonvalley/marey/i2v","name":"Marey Realism V1.5","created_by":"moonvalley","source":"official","description":"Generate a video starting from an image as the first frame with Marey, a generative video model trained exclusively on fully licensed data.","status":"active","release_date":"2025-08-14","model_type":"video","page_url":"https://fal.run/moonvalley/marey/i2v","tagline":"Generate a video starting from an image as the first frame with Marey, a generative video model trained exclusively on fully licensed data.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"moonvalley/marey/motion-transfer","name":"Marey Realism V1.5","created_by":"moonvalley","source":"official","description":"Pull motion from a reference video and apply it to new subjects or scenes.","status":"active","release_date":"2025-08-14","model_type":"other","page_url":"https://fal.run/moonvalley/marey/motion-transfer","tagline":"Pull motion from a reference video and apply it to new subjects or scenes.","last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"moonvalley/marey/pose-transfer","name":"Marey Realism V1.5","created_by":"moonvalley","source":"official","description":"Ideal for matching human movement.","status":"active","release_date":"2025-08-14","model_type":"other","page_url":"https://fal.run/moonvalley/marey/pose-transfer","tagline":"Ideal for matching human movement.","last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"moonvalley/marey/t2v","name":"Marey Realism V1.5","created_by":"moonvalley","source":"official","description":"Generate a video from a text prompt with Marey, a generative video model trained exclusively on fully licensed 
data.","status":"active","release_date":"2025-08-14","model_type":"video","page_url":"https://fal.run/moonvalley/marey/t2v","tagline":"Generate a video from a text prompt with Marey, a generative video model trained exclusively on fully licensed data.","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"nvidia/cosmos-3-super/image-to-video","name":"Cosmos 3 Super Image to Video","created_by":"nvidia","source":"official","description":"Cosmos3 is a collection of Omnimodal world models capable of generating dynamic, high-quality video, image, audio, and action commands from combinations of text, image, video, and action trajectory in","status":"active","release_date":"2026-06-01","model_type":"video","page_url":"https://fal.run/nvidia/cosmos-3-super/image-to-video","tagline":"Cosmos3 is a collection of Omnimodal world models capable of generating dynamic, high-quality video, image, audio, and action commands from combinations of text, image, video, and action trajectory in","capabilities":{"vision":true},"modalities":{"input":["text","image","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-02","last_updated":"2026-06-03"},{"id":"nvidia/cosmos-3-super/text-to-image","name":"Cosmos 3 Super","created_by":"nvidia","source":"official","description":"Cosmos3 is a collection of Omnimodal world models capable of generating dynamic, high-quality video, image, audio, and action commands from combinations of text, image, video, and action trajectory in","status":"active","release_date":"2026-06-01","model_type":"image","page_url":"https://fal.run/nvidia/cosmos-3-super/text-to-image","tagline":"Cosmos3 is a collection of Omnimodal world models capable of generating dynamic, high-quality video, image, audio, and action commands from combinations of text, image, video, and action trajectory 
in","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-02","last_updated":"2026-06-03"},{"id":"nvidia/nemotron-3-nano-omni/audio","name":"Nemotron 3 Nano Omni","created_by":"nvidia","source":"official","description":"Audio reasoning variant of NVIDIA's Nemotron 3 Nano Omni.","status":"active","release_date":"2026-04-27","model_type":"transcription","page_url":"https://fal.run/nvidia/nemotron-3-nano-omni/audio","tagline":"Audio reasoning variant of NVIDIA's Nemotron 3 Nano Omni.","capabilities":{"reasoning":true},"modalities":{"input":["audio"],"output":["text"]},"endpoints":["audio_transcriptions"],"last_seen_at":"2026-04-30","last_updated":"2026-05-11"},{"id":"nvidia/nemotron-3-nano-omni/video","name":"Nemotron 3 Nano Omni","created_by":"nvidia","source":"official","description":"Video reasoning variant of NVIDIA's Nemotron 3 Nano Omni.","status":"active","release_date":"2026-04-27","model_type":"other","page_url":"https://fal.run/nvidia/nemotron-3-nano-omni/video","tagline":"Video reasoning variant of NVIDIA's Nemotron 3 Nano Omni.","capabilities":{"reasoning":true},"last_seen_at":"2026-05-13","last_updated":"2026-06-03"},{"id":"nvidia/nemotron-3-nano-omni/vision","name":"Nemotron 3 Nano Omni","created_by":"nvidia","source":"official","description":"Vision reasoning variant of NVIDIA's Nemotron 3 Nano Omni.","status":"active","release_date":"2026-04-27","model_type":"other","page_url":"https://fal.run/nvidia/nemotron-3-nano-omni/vision","tagline":"Vision reasoning variant of NVIDIA's Nemotron 3 Nano Omni.","capabilities":{"vision":true,"reasoning":true},"last_seen_at":"2026-04-30","last_updated":"2026-05-11"},{"id":"nvidia/nemotron-3-nano-omni","name":"Nemotron 3 Nano Omni","created_by":"nvidia","source":"official","description":"Open, efficient reasoning model from 
NVIDIA.","status":"active","release_date":"2026-04-27","model_type":"other","page_url":"https://fal.run/nvidia/nemotron-3-nano-omni","tagline":"Open, efficient reasoning model from NVIDIA.","capabilities":{"reasoning":true},"last_seen_at":"2026-04-30","last_updated":"2026-05-11"},{"id":"nvidia/nemotron-asr-multilingual/asr","name":"Nemotron Asr Multilingual","created_by":"nvidia","source":"official","description":"Nemotron-ASR-Streaming is a multi lingual, streaming Automatic Speech Recognition (ASR) engineered to deliver high-quality multi lingual transcription across both low-latency streaming and high-throug","status":"active","release_date":"2026-06-01","model_type":"transcription","page_url":"https://fal.run/nvidia/nemotron-asr-multilingual/asr","tagline":"Nemotron-ASR-Streaming is a multi lingual, streaming Automatic Speech Recognition (ASR) engineered to deliver high-quality multi lingual transcription across both low-latency streaming and high-throug","capabilities":{"streaming":true},"modalities":{"input":["audio"],"output":["text"]},"endpoints":["audio_transcriptions"],"last_seen_at":"2026-06-10","last_updated":"2026-06-18"},{"id":"openai/gpt-image-2/edit","name":"GPT Image 2 API","created_by":"openai","source":"official","family":"gpt-image-2","description":"GPT Image 2, OpenAI's latest image model, is capable of making fine-grained, detailed edits to images.","status":"active","release_date":"2026-04-20","model_type":"image","page_url":"https://fal.run/openai/gpt-image-2/edit","tagline":"GPT Image 2, OpenAI's latest image model, is capable of making fine-grained, detailed edits to images.","capabilities":{"streaming":true,"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-02","last_updated":"2026-06-03"},{"id":"openai/gpt-image-2","name":"GPT Image 2 API","created_by":"openai","source":"official","family":"gpt-image-2","description":"GPT Image 2, OpenAI's latest image model, is 
capable of creating extremely detailed images with fine typography.","status":"active","release_date":"2026-04-20","model_type":"image","page_url":"https://fal.run/openai/gpt-image-2","tagline":"GPT Image 2, OpenAI's latest image model, is capable of creating extremely detailed images with fine typography.","capabilities":{"streaming":true,"vision":true,"tool_call":false,"structured_output":false,"json_mode":false,"fine_tuning":false,"reasoning":false,"batch":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-11","last_updated":"2026-06-18","license":"proprietary","open_weight":false},{"id":"openrouter/router/audio","name":"OpenRouter [Audio]","created_by":"openrouter","source":"official","description":" Run any audio capable LLM with fal.","status":"active","release_date":"2025-12-22","model_type":"other","page_url":"https://fal.run/openrouter/router/audio","tagline":" Run any audio capable LLM with fal.","last_seen_at":"2026-05-06","last_updated":"2026-05-11"},{"id":"openrouter/router/enterprise","name":"OpenRouter [Enterprise]","created_by":"openrouter","source":"official","description":"Run any LLM (Large Language Model) with fal, powered by OpenRouter.","status":"active","release_date":"2025-12-22","model_type":"other","page_url":"https://fal.run/openrouter/router/enterprise","tagline":"Run any LLM (Large Language Model) with fal, powered by OpenRouter.","capabilities":{"streaming":true},"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"openrouter/router/openai/v1/chat/completions","name":"OpenRouter Chat Completions [OpenAI Compatible]","created_by":"openrouter","source":"official","description":"OpenAI-compatible chat completions API.","status":"active","release_date":"2025-11-12","model_type":"other","page_url":"https://fal.run/openrouter/router/openai/v1/chat/completions","tagline":"OpenAI-compatible chat completions 
API.","last_seen_at":"2026-05-06","last_updated":"2026-05-11"},{"id":"openrouter/router/openai/v1/embeddings","name":"OpenRouter Embeddings [OpenAI Compatible]","created_by":"openrouter","source":"official","description":"Generate text embeddings using OpenAI-compatible API.","status":"active","release_date":"2025-11-12","model_type":"other","page_url":"https://fal.run/openrouter/router/openai/v1/embeddings","tagline":"Generate text embeddings using OpenAI-compatible API.","last_seen_at":"2026-05-06","last_updated":"2026-05-11"},{"id":"openrouter/router/openai/v1/responses","name":"OpenRouter Responses [OpenAI Compatible]","created_by":"openrouter","source":"official","description":"The OpenRouter Responses API with fal, powered by OpenRouter, provides unified access to a wide range of large language models - including GPT, Claude, Gemini, and many others through a single API int","status":"active","release_date":"2025-11-13","model_type":"other","page_url":"https://fal.run/openrouter/router/openai/v1/responses","tagline":"The OpenRouter Responses API with fal, powered by OpenRouter, provides unified access to a wide range of large language models - including GPT, Claude, Gemini, and many others through a single API int","last_seen_at":"2026-05-06","last_updated":"2026-05-11"},{"id":"openrouter/router/video/enterprise","name":"OpenRouter [Video][Enterprise]","created_by":"openrouter","source":"official","description":"Run any VLM (Video Language Model) with fal, powered by OpenRouter.","status":"active","release_date":"2026-01-13","model_type":"other","page_url":"https://fal.run/openrouter/router/video/enterprise","tagline":"Run any VLM (Video Language Model) with fal, powered by OpenRouter.","capabilities":{"streaming":true},"last_seen_at":"2026-05-06","last_updated":"2026-05-11"},{"id":"openrouter/router/video","name":"OpenRouter [Video]","created_by":"openrouter","source":"official","description":"Run any video-capable LLM with 
fal.","status":"active","release_date":"2026-01-13","model_type":"other","page_url":"https://fal.run/openrouter/router/video","tagline":"Run any video-capable LLM with fal.","capabilities":{"streaming":true},"last_seen_at":"2026-05-06","last_updated":"2026-05-11"},{"id":"openrouter/router/vision","name":"OpenRouter [Vision]","created_by":"openrouter","source":"official","description":"Run any Vision Language Model with fal.","status":"active","release_date":"2025-11-12","model_type":"other","page_url":"https://fal.run/openrouter/router/vision","tagline":"Run any Vision Language Model with fal.","capabilities":{"streaming":true,"vision":true},"last_seen_at":"2026-06-26","last_updated":"2026-06-29"},{"id":"openrouter/router","name":"OpenRouter","created_by":"openrouter","source":"official","description":"Run any LLM with fal.","status":"active","release_date":"2025-11-12","model_type":"other","page_url":"https://fal.run/openrouter/router","tagline":"Run any LLM with fal.","capabilities":{"streaming":true,"reasoning":true,"structured_output":true,"json_mode":true},"last_seen_at":"2026-05-06","last_updated":"2026-05-11"},{"id":"perceptron/isaac-01/openai/v1/chat/completions","name":"Isaac 0.1 [OpenAI Compatible Endpoint]","created_by":"perceptron","source":"official","description":"OpenAI spec compatible endpoint of Isaac-01 which is a multimodal vision-language model from Perceptron for various vision language tasks.","status":"active","release_date":"2025-09-17","model_type":"other","page_url":"https://fal.run/perceptron/isaac-01/openai/v1/chat/completions","tagline":"OpenAI spec compatible endpoint of Isaac-01 which is a multimodal vision-language model from Perceptron for various vision language tasks.","capabilities":{"vision":true},"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"perceptron/isaac-01","name":"Isaac 0.1","created_by":"perceptron","source":"official","description":"Isaac-01 is a multimodal vision-language model from Perceptron for 
various vision language tasks.","status":"active","release_date":"2025-09-17","model_type":"other","page_url":"https://fal.run/perceptron/isaac-01","tagline":"Isaac-01 is a multimodal vision-language model from Perceptron for various vision language tasks.","capabilities":{"streaming":true,"vision":true},"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"pixelcut/background-removal","name":"Pixelcut Background Remover","created_by":"pixelcut","source":"official","description":"Pixelcut’s Background Remover enables fast, ultra high-quality removal of backgrounds from images.","status":"active","release_date":"2026-03-04","model_type":"image","page_url":"https://fal.run/pixelcut/background-removal","tagline":"Pixelcut’s Background Remover enables fast, ultra high-quality removal of backgrounds from images.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-11","last_updated":"2026-06-18"},{"id":"pixelcut/video-background-removal","name":"Pixelcut Video Background Removal","created_by":"pixelcut","source":"official","description":"Pixelcut's Video Background Remover is an AI segmentation model that erases backgrounds frame by frame, with seamless temporal consistency.","status":"active","release_date":"2026-06-11","model_type":"other","page_url":"https://fal.run/pixelcut/video-background-removal","tagline":"Pixelcut's Video Background Remover is an AI segmentation model that erases backgrounds frame by frame, with seamless temporal consistency.","last_seen_at":"2026-06-12","last_updated":"2026-06-18"},{"id":"resemble-ai/chatterboxhd/speech-to-speech","name":"Chatterboxhd","created_by":"resemble-ai","source":"official","description":"Transform voices using Resemble AI's Chatterbox.","status":"active","release_date":"2025-06-02","model_type":"other","page_url":"https://fal.run/resemble-ai/chatterboxhd/speech-to-speech","tagline":"Transform voices using Resemble AI's 
Chatterbox.","last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"resemble-ai/chatterboxhd/text-to-speech","name":"Chatterboxhd","created_by":"resemble-ai","source":"official","description":"Generate expressive, natural speech with Resemble AI's Chatterbox.","status":"active","release_date":"2025-06-02","model_type":"tts","page_url":"https://fal.run/resemble-ai/chatterboxhd/text-to-speech","tagline":"Generate expressive, natural speech with Resemble AI's Chatterbox.","modalities":{"input":["text"],"output":["audio"]},"endpoints":["audio_speech"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"rundiffusion-fal/juggernaut-flux/base/image-to-image","name":"Juggernaut Flux Base","created_by":"rundiffusion-fal","source":"official","description":"Juggernaut Base Flux by RunDiffusion is a drop-in replacement for Flux [Dev] that delivers sharper details, richer colors, and enhanced realism, while instantly boosting LoRAs and LyCORIS with full co","status":"active","release_date":"2025-03-05","model_type":"image","page_url":"https://fal.run/rundiffusion-fal/juggernaut-flux/base/image-to-image","tagline":"Juggernaut Base Flux by RunDiffusion is a drop-in replacement for Flux [Dev] that delivers sharper details, richer colors, and enhanced realism, while instantly boosting LoRAs and LyCORIS with full co","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"rundiffusion-fal/juggernaut-flux/base","name":"Juggernaut Flux Base","created_by":"rundiffusion-fal","source":"official","description":"Juggernaut Base Flux by RunDiffusion is a drop-in replacement for Flux [Dev] that delivers sharper details, richer colors, and enhanced realism, while instantly boosting LoRAs and LyCORIS with full 
co","status":"active","release_date":"2025-03-05","model_type":"image","page_url":"https://fal.run/rundiffusion-fal/juggernaut-flux/base","tagline":"Juggernaut Base Flux by RunDiffusion is a drop-in replacement for Flux [Dev] that delivers sharper details, richer colors, and enhanced realism, while instantly boosting LoRAs and LyCORIS with full co","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"rundiffusion-fal/juggernaut-flux/lightning","name":"Juggernaut Flux Lightning","created_by":"rundiffusion-fal","source":"official","description":"Juggernaut Lightning Flux by RunDiffusion provides blazing-fast, high-quality images rendered at five times the speed of Flux.","status":"active","release_date":"2025-03-05","model_type":"image","page_url":"https://fal.run/rundiffusion-fal/juggernaut-flux/lightning","tagline":"Juggernaut Lightning Flux by RunDiffusion provides blazing-fast, high-quality images rendered at five times the speed of Flux.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"rundiffusion-fal/juggernaut-flux-lora/inpainting","name":"Juggernaut Flux Lora","created_by":"rundiffusion-fal","source":"official","description":"Juggernaut Base Flux LoRA Inpainting by RunDiffusion is a drop-in replacement for Flux [Dev] inpainting that delivers sharper details, richer colors, and enhanced realism to all your LoRAs and LyCORIS","status":"active","release_date":"2025-04-21","model_type":"image","page_url":"https://fal.run/rundiffusion-fal/juggernaut-flux-lora/inpainting","tagline":"Juggernaut Base Flux LoRA Inpainting by RunDiffusion is a drop-in replacement for Flux [Dev] inpainting that delivers sharper details, richer colors, and enhanced realism to all your LoRAs and 
LyCORIS","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"rundiffusion-fal/juggernaut-flux-lora","name":"Juggernaut Flux Base LoRA","created_by":"rundiffusion-fal","source":"official","description":"Juggernaut Base Flux LoRA by RunDiffusion is a drop-in replacement for Flux [Dev] that delivers sharper details, richer colors, and enhanced realism to all your LoRAs and LyCORIS with full compatibili","status":"active","release_date":"2025-03-05","model_type":"image","page_url":"https://fal.run/rundiffusion-fal/juggernaut-flux-lora","tagline":"Juggernaut Base Flux LoRA by RunDiffusion is a drop-in replacement for Flux [Dev] that delivers sharper details, richer colors, and enhanced realism to all your LoRAs and LyCORIS with full compatibili","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"rundiffusion-fal/juggernaut-flux/pro/image-to-image","name":"Juggernaut Flux Pro","created_by":"rundiffusion-fal","source":"official","description":"Juggernaut Pro Flux by RunDiffusion is the flagship Juggernaut model rivaling some of the most advanced image models available, often surpassing them in realism.","status":"active","release_date":"2025-03-05","model_type":"image","page_url":"https://fal.run/rundiffusion-fal/juggernaut-flux/pro/image-to-image","tagline":"Juggernaut Pro Flux by RunDiffusion is the flagship Juggernaut model rivaling some of the most advanced image models available, often surpassing them in realism.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"rundiffusion-fal/juggernaut-flux/pro","name":"Juggernaut Flux 
Pro","created_by":"rundiffusion-fal","source":"official","description":"Juggernaut Pro Flux by RunDiffusion is the flagship Juggernaut model rivaling some of the most advanced image models available, often surpassing them in realism.","status":"active","release_date":"2025-03-05","model_type":"image","page_url":"https://fal.run/rundiffusion-fal/juggernaut-flux/pro","tagline":"Juggernaut Pro Flux by RunDiffusion is the flagship Juggernaut model rivaling some of the most advanced image models available, often surpassing them in realism.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"rundiffusion-fal/rundiffusion-photo-flux","name":"Rundiffusion Photo Flux","created_by":"rundiffusion-fal","source":"official","description":"RunDiffusion Photo Flux provides insane realism.","status":"active","release_date":"2025-03-05","model_type":"image","page_url":"https://fal.run/rundiffusion-fal/rundiffusion-photo-flux","tagline":"RunDiffusion Photo Flux provides insane realism.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"smoretalk-ai/rembg-enhance","name":"Rembg Enhance (Remove Background Enhance)","created_by":"smoretalk-ai","source":"official","description":"Rembg-enhance is optimized for 2D vector images, 3D graphics, and photos by leveraging matting technology.","status":"active","release_date":"2025-05-09","model_type":"image","page_url":"https://fal.run/smoretalk-ai/rembg-enhance","tagline":"Rembg-enhance is optimized for 2D vector images, 3D graphics, and photos by leveraging matting technology.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-05-13","last_updated":"2026-06-03"},{"id":"sonauto/v2/extend","name":"Sonauto 
V2","created_by":"sonauto","source":"official","description":"Extend an existing song","status":"active","release_date":"2025-08-23","model_type":"other","page_url":"https://fal.run/sonauto/v2/extend","tagline":"Extend an existing song","last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"sonauto/v2/inpaint","name":"Sonauto V2","created_by":"sonauto","source":"official","description":"Replace sections of an existing audio with newly generated content","status":"active","release_date":"2025-08-23","model_type":"other","page_url":"https://fal.run/sonauto/v2/inpaint","tagline":"Replace sections of an existing audio with newly generated content","last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"sonauto/v2/text-to-music","name":"Sonauto V2","created_by":"sonauto","source":"official","description":"Create full songs in any style","status":"active","release_date":"2025-08-23","model_type":"other","page_url":"https://fal.run/sonauto/v2/text-to-music","tagline":"Create full songs in any style","last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"sonilo/v1.1/text-to-music","name":"Sonilo V1.1 Text to Music","created_by":"sonilo","source":"official","description":"Generates production-ready music from a single text prompt, with full control over style, mood, instrumentation, and exact duration.","status":"active","release_date":"2026-06-03","model_type":"other","page_url":"https://fal.run/sonilo/v1.1/text-to-music","tagline":"Generates production-ready music from a single text prompt, with full control over style, mood, instrumentation, and exact duration.","last_seen_at":"2026-06-03","last_updated":"2026-06-10"},{"id":"sonilo/v1.1/video-to-music","name":"V1.1","created_by":"sonilo","source":"official","description":"Analyzes your video's pacing, mood, and timing to generate a frame-synced, commercial-ready soundtrack in 
seconds","status":"active","release_date":"2026-06-03","model_type":"other","page_url":"https://fal.run/sonilo/v1.1/video-to-music","tagline":"Analyzes your video's pacing, mood, and timing to generate a frame-synced, commercial-ready soundtrack in seconds","last_seen_at":"2026-06-03","last_updated":"2026-06-10"},{"id":"tripo3d/h3.1/image-to-3d","name":"Tripo H3.1 Image to 3D","created_by":"tripo3d","source":"official","description":"Generate high-quality 3D models from a single image using Tripo H3.1.","status":"active","release_date":"2026-04-07","model_type":"other","page_url":"https://fal.run/tripo3d/h3.1/image-to-3d","tagline":"Generate high-quality 3D models from a single image using Tripo H3.1.","capabilities":{"vision":true},"last_seen_at":"2026-05-07","last_updated":"2026-05-11"},{"id":"tripo3d/h3.1/multiview-to-3d","name":"Tripo H3.1 Multiview to 3D","created_by":"tripo3d","source":"official","description":"Generate 3D models from multiple view images using Tripo H3.1.","status":"active","release_date":"2026-04-07","model_type":"other","page_url":"https://fal.run/tripo3d/h3.1/multiview-to-3d","tagline":"Generate 3D models from multiple view images using Tripo H3.1.","capabilities":{"vision":true},"last_seen_at":"2026-05-07","last_updated":"2026-05-11"},{"id":"tripo3d/h3.1/text-to-3d","name":"Tripo H3.1 Text to 3D","created_by":"tripo3d","source":"official","description":"Generate 3D models from text descriptions using Tripo H3.1.","status":"active","release_date":"2026-04-07","model_type":"other","page_url":"https://fal.run/tripo3d/h3.1/text-to-3d","tagline":"Generate 3D models from text descriptions using Tripo H3.1.","last_seen_at":"2026-05-07","last_updated":"2026-05-11"},{"id":"tripo3d/p1/image-to-3d","name":"Tripo P1 Image to 3D","created_by":"tripo3d","source":"official","description":"Generate 3D models from a single image using Tripo 
P1.","status":"active","release_date":"2026-04-07","model_type":"other","page_url":"https://fal.run/tripo3d/p1/image-to-3d","tagline":"Generate 3D models from a single image using Tripo P1.","capabilities":{"vision":true},"last_seen_at":"2026-05-07","last_updated":"2026-05-11"},{"id":"tripo3d/p1/text-to-3d","name":"Tripo P1 Text to 3D","created_by":"tripo3d","source":"official","description":"Generate 3D models from text descriptions using Tripo P1.","status":"active","release_date":"2026-04-07","model_type":"other","page_url":"https://fal.run/tripo3d/p1/text-to-3d","tagline":"Generate 3D models from text descriptions using Tripo P1.","last_seen_at":"2026-05-07","last_updated":"2026-05-11"},{"id":"tripo3d/tripo/v2.5/image-to-3d","name":"Tripo3D","created_by":"tripo3d","source":"official","description":"State of the art Image to 3D Object generation.","status":"active","release_date":"2025-04-25","model_type":"other","page_url":"https://fal.run/tripo3d/tripo/v2.5/image-to-3d","tagline":"State of the art Image to 3D Object generation.","capabilities":{"vision":true},"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"tripo3d/tripo/v2.5/multiview-to-3d","name":"Tripo3D","created_by":"tripo3d","source":"official","description":"State of the art Multiview to 3D Object generation.","status":"active","release_date":"2025-06-18","model_type":"other","page_url":"https://fal.run/tripo3d/tripo/v2.5/multiview-to-3d","tagline":"State of the art Multiview to 3D Object generation.","capabilities":{"vision":true},"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"tripo3d/triposplat","name":"Triposplat","created_by":"tripo3d","source":"official","description":"TripoSplat is an open-source model from TripoAI / VAST AI Research that converts a single 2D image into high-quality 3D Gaussians using a novel learned density-control 
approach","status":"active","release_date":"2026-06-03","model_type":"other","page_url":"https://fal.run/tripo3d/triposplat","tagline":"TripoSplat is an open-source model from TripoAI / VAST AI Research that converts a single 2D image into high-quality 3D Gaussians using a novel learned density-control approach","capabilities":{"vision":true},"last_seen_at":"2026-06-03","last_updated":"2026-06-10"},{"id":"veed/avatars/audio-to-video","name":"Avatars","created_by":"veed","source":"official","description":"Generate high-quality videos with UGC-like avatars from audio","status":"active","release_date":"2025-05-28","model_type":"other","page_url":"https://fal.run/veed/avatars/audio-to-video","tagline":"Generate high-quality videos with UGC-like avatars from audio","last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"veed/avatars/text-to-video","name":"Avatars","created_by":"veed","source":"official","description":"Generate high-quality videos with UGC-like avatars from text","status":"active","release_date":"2025-05-28","model_type":"video","page_url":"https://fal.run/veed/avatars/text-to-video","tagline":"Generate high-quality videos with UGC-like avatars from text","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"veed/fabric-1.0/fast","name":"Fabric 1.0 Fast","created_by":"veed","source":"official","description":"VEED Fabric 1.0 is an image-to-video API that turns any image into a talking video","status":"active","release_date":"2025-10-01","model_type":"video","page_url":"https://fal.run/veed/fabric-1.0/fast","tagline":"VEED Fabric 1.0 is an image-to-video API that turns any image into a talking video","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-23","last_updated":"2026-05-11"},{"id":"veed/fabric-1.0/text","name":"Fabric 
1.0","created_by":"veed","source":"official","description":"VEED Fabric 1.0 text-to-video API","status":"active","release_date":"2025-12-12","model_type":"video","page_url":"https://fal.run/veed/fabric-1.0/text","tagline":"VEED Fabric 1.0 text-to-video API","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-23","last_updated":"2026-05-11"},{"id":"veed/fabric-1.0","name":"Fabric 1.0","created_by":"veed","source":"official","description":"VEED Fabric 1.0 is an image-to-video API that turns any image into a talking video","status":"active","release_date":"2025-09-19","model_type":"video","page_url":"https://fal.run/veed/fabric-1.0","tagline":"VEED Fabric 1.0 is an image-to-video API that turns any image into a talking video","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-23","last_updated":"2026-05-11"},{"id":"veed/lipsync","name":"Lipsync","created_by":"veed","source":"official","description":"Generate realistic lipsync from any audio using VEED's latest model","status":"active","release_date":"2025-05-28","model_type":"other","page_url":"https://fal.run/veed/lipsync","tagline":"Generate realistic lipsync from any audio using VEED's latest model","last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"veed/subtitles","name":"Subtitles","created_by":"veed","source":"official","description":"VEED’s Subtitles API transforms raw footage into polished, publish-ready content with professional burned-in subtitles starting at a base rate of $0.10 per minute.","status":"active","release_date":"2026-05-11","model_type":"other","page_url":"https://fal.run/veed/subtitles","tagline":"VEED’s Subtitles API transforms raw footage into polished, publish-ready content with professional burned-in subtitles starting at a base rate of $0.10 per 
minute.","last_seen_at":"2026-06-11","last_updated":"2026-06-18"},{"id":"veed/video-background-removal/fast","name":"Video Background Removal","created_by":"veed","source":"official","description":"Remove background from any video with people and objects.","status":"active","release_date":"2025-12-01","model_type":"other","page_url":"https://fal.run/veed/video-background-removal/fast","tagline":"Remove background from any video with people and objects.","last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"veed/video-background-removal/green-screen","name":"Video Background Removal","created_by":"veed","source":"official","description":"Remove background from videos filmed using chromakey, with automatic green spill suppression for clean, professional edges.","status":"active","release_date":"2025-11-28","model_type":"other","page_url":"https://fal.run/veed/video-background-removal/green-screen","tagline":"Remove background from videos filmed using chromakey, with automatic green spill suppression for clean, professional edges.","last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"veed/video-background-removal","name":"Video Background Removal","created_by":"veed","source":"official","description":"Remove background from any video with people and objects.","status":"active","release_date":"2025-11-28","model_type":"other","page_url":"https://fal.run/veed/video-background-removal","tagline":"Remove background from any video with people and objects.","last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"wan/v2.6/image-to-image","name":"Wan v2.6 Image to Image","created_by":"wan","source":"official","description":"Wan 2.6 image-to-image model.","status":"active","release_date":"2025-12-23","model_type":"image","page_url":"https://fal.run/wan/v2.6/image-to-image","tagline":"Wan 2.6 image-to-image 
model.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"wan/v2.6/image-to-video/flash","name":"V2.6","created_by":"wan","source":"official","description":"Wan 2.6 image-to-video flash model.","status":"active","release_date":"2026-01-18","model_type":"video","page_url":"https://fal.run/wan/v2.6/image-to-video/flash","tagline":"Wan 2.6 image-to-video flash model.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"wan/v2.6/image-to-video","name":"Wan v2.6 Image to Video","created_by":"wan","source":"official","description":"Wan 2.6 image-to-video model.","status":"active","release_date":"2025-12-15","model_type":"video","page_url":"https://fal.run/wan/v2.6/image-to-video","tagline":"Wan 2.6 image-to-video model.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"wan/v2.6/reference-to-video/flash","name":"V2.6","created_by":"wan","source":"official","description":"Wan 2.6 reference-to-video flash model.","status":"active","release_date":"2026-02-06","model_type":"other","page_url":"https://fal.run/wan/v2.6/reference-to-video/flash","tagline":"Wan 2.6 reference-to-video flash model.","last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"wan/v2.6/reference-to-video","name":"Wan v2.6 Reference to Video","created_by":"wan","source":"official","description":"Wan 2.6 reference-to-video model.","status":"active","release_date":"2025-12-16","model_type":"other","page_url":"https://fal.run/wan/v2.6/reference-to-video","tagline":"Wan 2.6 reference-to-video model.","last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"wan/v2.6/text-to-image","name":"Wan v2.6 Text to 
Image","created_by":"wan","source":"official","description":"Wan 2.6 text-to-image model.","status":"active","release_date":"2025-12-23","model_type":"image","page_url":"https://fal.run/wan/v2.6/text-to-image","tagline":"Wan 2.6 text-to-image model.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-20","last_updated":"2026-05-11"},{"id":"wan/v2.6/text-to-video","name":"Wan v2.6 Text to Video","created_by":"wan","source":"official","description":"Wan 2.6 text-to-video model.","status":"active","release_date":"2025-12-16","model_type":"video","page_url":"https://fal.run/wan/v2.6/text-to-video","tagline":"Wan 2.6 text-to-video model.","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"xai/grok-imagine-image/edit","name":"Grok Imagine Image","created_by":"xai","source":"official","family":"grok-imagine","description":"Edit images precisely with xAI's Grok Imagine model","status":"active","release_date":"2026-01-29","model_type":"image","page_url":"https://fal.run/xai/grok-imagine-image/edit","tagline":"Edit images precisely with xAI's Grok Imagine model","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"xai/grok-imagine-image/quality/edit","name":"Grok Imagine Image Editing Quality","created_by":"xai","source":"official","family":"grok-imagine","description":"Grok Imagine Pro is an advanced AI model from xAI that creates high-quality visuals from text prompts and allows you to edit or analyze existing images.","status":"active","release_date":"2026-04-09","model_type":"image","page_url":"https://fal.run/xai/grok-imagine-image/quality/edit","tagline":"Grok Imagine Pro is an advanced AI model from xAI that creates high-quality visuals from text prompts and allows you to edit or 
analyze existing images.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-05-07","last_updated":"2026-05-11"},{"id":"xai/grok-imagine-image/quality/text-to-image","name":"Grok Imagine Image","created_by":"xai","source":"official","family":"grok-imagine","description":"Grok Imagine Pro is an advanced AI model from xAI that creates high-quality visuals from text prompts and allows you to edit or analyze existing images.","status":"active","release_date":"2026-04-09","model_type":"image","page_url":"https://fal.run/xai/grok-imagine-image/quality/text-to-image","tagline":"Grok Imagine Pro is an advanced AI model from xAI that creates high-quality visuals from text prompts and allows you to edit or analyze existing images.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-05-07","last_updated":"2026-05-11"},{"id":"xai/grok-imagine-image","name":"Grok Imagine Image","created_by":"xai","source":"official","family":"grok-imagine","description":"Generate highly aesthetic images with xAI's Grok Imagine Image generation model.","status":"active","release_date":"2026-01-29","model_type":"image","page_url":"https://fal.run/xai/grok-imagine-image","tagline":"Generate highly aesthetic images with xAI's Grok Imagine Image generation model.","capabilities":{"vision":true,"streaming":true,"tool_call":true,"batch":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11","license":"proprietary","open_weight":false},{"id":"xai/grok-imagine-video/edit-video","name":"Grok Imagine Video","created_by":"xai","source":"official","family":"grok-imagine","description":"Edit videos using xAI's Grok Imagine","status":"active","release_date":"2026-01-29","model_type":"other","page_url":"https://fal.run/xai/grok-imagine-video/edit-video","tagline":"Edit videos 
using xAI's Grok Imagine","last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"xai/grok-imagine-video/extend-video","name":"Grok Imagine Extend Video","created_by":"xai","source":"official","family":"grok-imagine","description":"Extend videos with xAI's Grok Imagine video model","status":"active","release_date":"2026-03-24","model_type":"other","page_url":"https://fal.run/xai/grok-imagine-video/extend-video","tagline":"Extend videos with xAI's Grok Imagine video model","last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"xai/grok-imagine-video/image-to-video","name":"Grok Imagine Video","created_by":"xai","source":"official","family":"grok-imagine","description":"Generate videos from images with audio using xAI's Grok Imagine Video model.","status":"active","release_date":"2026-01-29","model_type":"video","page_url":"https://fal.run/xai/grok-imagine-video/image-to-video","tagline":"Generate videos from images with audio using xAI's Grok Imagine Video model.","capabilities":{"vision":true},"modalities":{"input":["text","image","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"xai/grok-imagine-video/reference-to-video","name":"Grok Imagine Reference to Video","created_by":"xai","source":"official","family":"grok-imagine","description":"Generate videos using multiple reference images with xAI's Grok Imagine video model","status":"active","release_date":"2026-03-24","model_type":"video","page_url":"https://fal.run/xai/grok-imagine-video/reference-to-video","tagline":"Generate videos using multiple reference images with xAI's Grok Imagine video model","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"xai/grok-imagine-video/text-to-video","name":"Grok Imagine Video","created_by":"xai","source":"official","family":"grok-imagine","description":"Generate videos 
with audio from text using Grok Imagine Video.","status":"active","release_date":"2026-01-29","model_type":"video","page_url":"https://fal.run/xai/grok-imagine-video/text-to-video","tagline":"Generate videos with audio from text using Grok Imagine Video.","modalities":{"input":["text","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"xai/grok-imagine-video/v1.5/image-to-video","name":"Grok Imagine Video 1.5","created_by":"xai","source":"official","family":"grok-imagine","description":"Generate videos from images with audio using xAI's Grok Imagine 1.5 Video model.","status":"active","release_date":"2026-05-31","model_type":"video","page_url":"https://fal.run/xai/grok-imagine-video/v1.5/image-to-video","tagline":"Generate videos from images with audio using xAI's Grok Imagine 1.5 Video model.","capabilities":{"vision":true},"modalities":{"input":["text","image","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-02","last_updated":"2026-06-03"},{"id":"xai/tts/v1","name":"xAI Text to Speech","created_by":"xai","source":"official","family":"tts","description":"Generate speech with expressive and realistic voices from xAI","status":"active","release_date":"2026-03-17","model_type":"tts","page_url":"https://fal.run/xai/tts/v1","tagline":"Generate speech with expressive and realistic voices from xAI","capabilities":{"streaming":true},"modalities":{"input":["text"],"output":["audio"]},"endpoints":["audio_speech"],"last_seen_at":"2026-06-02","last_updated":"2026-06-03"}]}; +export const provider: ProviderWithModels = {"id":"fal","name":"fal","region":"US","url":"https://fal.ai","api_url":"https://fal.run","docs_url":"https://fal.ai/docs","pricing_url":"https://fal.ai/pricing","description":"Generative media inference platform for image, video, audio, and multimodal model 
APIs.","type":"cloud","models_url":"https://api.fal.ai/v1/models","openai_compatible":false,"free_tier":false,"github_url":"https://github.com/fal-ai","twitter_url":"https://x.com/fal","icon":"\n \n","models":[{"id":"alibaba/happy-horse/image-to-video","name":"Happy Horse","created_by":"alibaba","source":"official","description":"Alibaba's #1-ranked Happy Horse 1.0 — generate 1080p video with synchronized native audio and multilingual lip-sync from text prompts or images.","status":"active","release_date":"2026-04-24","model_type":"video","page_url":"https://fal.run/alibaba/happy-horse/image-to-video","tagline":"Alibaba's #1-ranked Happy Horse 1.0 — generate 1080p video with synchronized native audio and multilingual lip-sync from text prompts or images.","capabilities":{"vision":true},"modalities":{"input":["text","image","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-28","last_updated":"2026-05-11"},{"id":"alibaba/happy-horse/reference-to-video","name":"Happy Horse","created_by":"alibaba","source":"official","description":"Generate 1080p video with synchronized native audio from a text prompt and references.","status":"active","release_date":"2026-04-27","model_type":"video","page_url":"https://fal.run/alibaba/happy-horse/reference-to-video","tagline":"Generate 1080p video with synchronized native audio from a text prompt and references.","capabilities":{"vision":true},"modalities":{"input":["text","image","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-28","last_updated":"2026-05-11"},{"id":"alibaba/happy-horse/text-to-video","name":"Happy Horse","created_by":"alibaba","source":"official","description":"Generate 1080p video with synchronized native audio from a text prompt.","status":"active","release_date":"2026-04-24","model_type":"video","page_url":"https://fal.run/alibaba/happy-horse/text-to-video","tagline":"Generate 1080p video with synchronized native audio from a text 
prompt.","modalities":{"input":["text","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-28","last_updated":"2026-05-11"},{"id":"alibaba/happy-horse/v1.1/image-to-video","name":"Happy Horse 1.1 Image to Video","created_by":"alibaba","source":"official","description":"Happy Horse 1.1 is Alibaba's #1-ranked video model.","status":"active","release_date":"2026-06-21","model_type":"video","page_url":"https://fal.run/alibaba/happy-horse/v1.1/image-to-video","tagline":"Happy Horse 1.1 is Alibaba's #1-ranked video model.","capabilities":{"vision":true},"modalities":{"input":["text","image","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"alibaba/happy-horse/v1.1/reference-to-video","name":"Happy Horse 1.1 Reference to Video","created_by":"alibaba","source":"official","description":"Happy Horse 1.1 is Alibaba's #1-ranked video model.","status":"active","release_date":"2026-06-21","model_type":"video","page_url":"https://fal.run/alibaba/happy-horse/v1.1/reference-to-video","tagline":"Happy Horse 1.1 is Alibaba's #1-ranked video model.","capabilities":{"vision":true},"modalities":{"input":["text","image","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"alibaba/happy-horse/v1.1/text-to-video","name":"Happy Horse 1.1 Text to Video","created_by":"alibaba","source":"official","description":"Happy Horse 1.1 is Alibaba's #1-ranked video model.","status":"active","release_date":"2026-06-21","model_type":"video","page_url":"https://fal.run/alibaba/happy-horse/v1.1/text-to-video","tagline":"Happy Horse 1.1 is Alibaba's #1-ranked video model.","modalities":{"input":["text","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"alibaba/happy-horse/video-edit","name":"Happy Horse Video Edit","created_by":"alibaba","source":"official","description":"HappyHorse video editing 
supports advanced video editing through natural language instructions.","status":"active","release_date":"2026-04-27","model_type":"other","page_url":"https://fal.run/alibaba/happy-horse/video-edit","tagline":"HappyHorse video editing supports advanced video editing through natural language instructions.","capabilities":{"vision":true},"last_seen_at":"2026-04-28","last_updated":"2026-05-11"},{"id":"argil/avatars/audio-to-video","name":"Avatars Audio to Video","created_by":"argil","source":"official","description":"High-quality avatar videos that feel real, generated from your audio","status":"active","release_date":"2025-09-01","model_type":"other","page_url":"https://fal.run/argil/avatars/audio-to-video","tagline":"High-quality avatar videos that feel real, generated from your audio","last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"argil/avatars/text-to-video","name":"Avatars Text to Video","created_by":"argil","source":"official","description":"High-quality avatar videos that feel real, generated from your text","status":"active","release_date":"2025-09-01","model_type":"video","page_url":"https://fal.run/argil/avatars/text-to-video","tagline":"High-quality avatar videos that feel real, generated from your text","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"async/tts-pro/v1.0","name":"Async Text to Speech Pro V1.0","created_by":"async","source":"official","family":"tts","description":"Generate professional-quality voiceovers in seconds with Async TTS Pro model text-based control over pauses, emphasis, and timing.","status":"active","release_date":"2026-06-18","model_type":"tts","page_url":"https://fal.run/async/tts-pro/v1.0","tagline":"Generate professional-quality voiceovers in seconds with Async TTS Pro model text-based control over pauses, emphasis, and 
timing.","modalities":{"input":["text"],"output":["audio"]},"endpoints":["audio_speech"],"last_seen_at":"2026-06-18","last_updated":"2026-06-20"},{"id":"bria/bria_video_eraser/erase/keypoints","name":"Bria Video Eraser","created_by":"bria","source":"official","description":"A high-fidelity capability for erasing unwanted objects, people, or visual elements from videos while maintaining aesthetic quality and temporal consistency.","status":"active","release_date":"2025-12-17","model_type":"other","page_url":"https://fal.run/bria/bria_video_eraser/erase/keypoints","tagline":"A high-fidelity capability for erasing unwanted objects, people, or visual elements from videos while maintaining aesthetic quality and temporal consistency.","last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"bria/bria_video_eraser/erase/mask","name":"Bria Video Eraser Erase Mask","created_by":"bria","source":"official","description":"A high-fidelity capability for erasing unwanted objects, people, or visual elements from videos while maintaining aesthetic quality and temporal consistency.","status":"active","release_date":"2025-12-17","model_type":"other","page_url":"https://fal.run/bria/bria_video_eraser/erase/mask","tagline":"A high-fidelity capability for erasing unwanted objects, people, or visual elements from videos while maintaining aesthetic quality and temporal consistency.","last_seen_at":"2026-01-26","last_updated":"2026-06-03"},{"id":"bria/bria_video_eraser/erase/prompt","name":"Bria Video Eraser","created_by":"bria","source":"official","description":"A high-fidelity capability for erasing unwanted objects, people, or visual elements from videos while maintaining aesthetic quality and temporal consistency","status":"active","release_date":"2025-12-17","model_type":"other","page_url":"https://fal.run/bria/bria_video_eraser/erase/prompt","tagline":"A high-fidelity capability for erasing unwanted objects, people, or visual elements from videos while maintaining aesthetic 
quality and temporal consistency","last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"bria/embed-product","name":"Embed Product","created_by":"bria","source":"official","family":"embed","description":"Seamlessly embed products into any scene with pixel-perfect control, automatic perspective, and natural lighting.","status":"active","release_date":"2026-02-25","model_type":"image","page_url":"https://fal.run/bria/embed-product","tagline":"Seamlessly integrate one or more products into a predefined scene with pixel-perfect control.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-05-20","last_updated":"2026-06-03"},{"id":"bria/extract-object","name":"Extract Object","created_by":"bria","source":"official","description":"Bria Extract Object uses text prompts to isolate a selected object from an image and return it as an RGBA PNG with a transparent background.","status":"active","release_date":"2026-06-28","model_type":"image","page_url":"https://fal.run/bria/extract-object","tagline":"Bria Extract Object uses text prompts to isolate a selected object from an image and return it as an RGBA PNG with a transparent background.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-29","last_updated":"2026-06-30"},{"id":"bria/fibo-bbq-preview/generate","name":"Fibo Bbq Preview","created_by":"bria","source":"official","description":"A preview to the next level of control of Text-to-Image models.","status":"active","release_date":"2026-03-02","model_type":"image","page_url":"https://fal.run/bria/fibo-bbq-preview/generate","tagline":"A preview to the next level of control of Text-to-Image 
models.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-03-02","last_updated":"2026-05-11"},{"id":"bria/fibo-edit/add_object_by_text","name":"Fibo Edit [Add Object by Text]","created_by":"bria","source":"official","description":"Precisely insert new objects into images with structured spatial commands.","status":"active","release_date":"2026-01-20","model_type":"image","page_url":"https://fal.run/bria/fibo-edit/add_object_by_text","tagline":"Precise, context-aware insertion of new objects into an existing image using simple, structured spatial commands.","capabilities":{"vision":true,"structured_output":true,"json_mode":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-05-20","last_updated":"2026-06-03"},{"id":"bria/fibo-edit/blend","name":"Fibo Edit [Blend]","created_by":"bria","source":"official","description":"image composition model.","status":"active","release_date":"2026-01-20","model_type":"image","page_url":"https://fal.run/bria/fibo-edit/blend","tagline":"Complex, multi-step visual composition through natural language.","capabilities":{"vision":true,"structured_output":true,"json_mode":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-05-20","last_updated":"2026-06-03"},{"id":"bria/fibo-edit/colorize","name":"Fibo Edit [Colorize]","created_by":"bria","source":"official","description":"Image colorization and color-grading model.","status":"active","release_date":"2026-01-20","model_type":"image","page_url":"https://fal.run/bria/fibo-edit/colorize","tagline":"Transforms the color treatment of images using predefined, style-based 
commands","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-05-20","last_updated":"2026-06-03"},{"id":"bria/fibo-edit/edit/structured_instruction","name":"Fibo Edit [Structured Instruction]","created_by":"bria","source":"official","description":"Structured Instructions Generation endpoint for Fibo Edit, Bria's newest editing model.","status":"active","release_date":"2026-01-20","model_type":"other","page_url":"https://fal.run/bria/fibo-edit/edit/structured_instruction","tagline":"Structured Instructions Generation endpoint for Fibo Edit, Bria's newest editing model.","capabilities":{"structured_output":true,"json_mode":true},"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"bria/fibo-edit/edit","name":"Fibo Edit","created_by":"bria","source":"official","description":"High-fidelity image editing model with state-of-the-art controllability.","status":"active","release_date":"2026-01-20","model_type":"image","page_url":"https://fal.run/bria/fibo-edit/edit","tagline":"A high-quality editing model that achieves maximum controllability and transparency by combining JSON + Mask + Image.","capabilities":{"vision":true,"structured_output":true,"json_mode":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-05-20","last_updated":"2026-06-03"},{"id":"bria/fibo-edit/erase_by_text","name":"Fibo Edit [Erase by Text]","created_by":"bria","source":"official","description":"Remove unwanted objects from images with a text prompt - fast, precise editing that seamlessly blends results.","status":"active","release_date":"2026-01-20","model_type":"image","page_url":"https://fal.run/bria/fibo-edit/erase_by_text","tagline":"Fast, reliable removal of unwanted elements from 
images.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-05-20","last_updated":"2026-06-03"},{"id":"bria/fibo-edit/relight","name":"Fibo Edit [Relight]","created_by":"bria","source":"official","description":"Precise, controllable photo re-lighting with structured text inputs.","status":"active","release_date":"2026-01-20","model_type":"image","page_url":"https://fal.run/bria/fibo-edit/relight","tagline":"Precise, controllable lighting changes using simple, structured text inputs.","capabilities":{"vision":true,"structured_output":true,"json_mode":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-05-20","last_updated":"2026-06-03"},{"id":"bria/fibo-edit/replace_object_by_text","name":"Fibo Edit [Replace Object by Text]","created_by":"bria","source":"official","description":"Replace any object in an image using plain language with fine-grained, precise edits and strong prompt adherence.","status":"active","release_date":"2026-01-20","model_type":"image","page_url":"https://fal.run/bria/fibo-edit/replace_object_by_text","tagline":"Natural, expressive object swapping within images using plain language","capabilities":{"vision":true,"structured_output":true,"json_mode":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-05-20","last_updated":"2026-06-03"},{"id":"bria/fibo-edit/reseason","name":"Fibo Edit [Reseason]","created_by":"bria","source":"official","description":"Transform the season or weather of an image - summer to winter, sunny to rainy - with realistic atmosphere and lighting.","status":"active","release_date":"2026-01-20","model_type":"image","page_url":"https://fal.run/bria/fibo-edit/reseason","tagline":"Transforms the seasonal or weather atmosphere of an 
image.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-05-20","last_updated":"2026-06-03"},{"id":"bria/fibo-edit/restore","name":"Fibo Edit [Restore]","created_by":"bria","source":"official","description":"Photo restoration model that automatically denoises, deblurs, and enhances old or damaged photos - removes imperfections while preserving original character.","status":"active","release_date":"2026-01-20","model_type":"image","page_url":"https://fal.run/bria/fibo-edit/restore","tagline":"Automatically renews and cleans noisy or degraded images.","capabilities":{"vision":true,"structured_output":true,"json_mode":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-05-20","last_updated":"2026-06-03"},{"id":"bria/fibo-edit/restyle","name":"Fibo Edit [Restyle]","created_by":"bria","source":"official","description":"Production-grade style transfer that maps photos to distinct artistic styles using curated, brand-safe presets.","status":"active","release_date":"2026-01-20","model_type":"image","page_url":"https://fal.run/bria/fibo-edit/restyle","tagline":"Transforms images into distinct artistic styles using curated, production-grade style mappings","capabilities":{"vision":true,"structured_output":true,"json_mode":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-05-20","last_updated":"2026-06-03"},{"id":"bria/fibo-edit/rewrite_text","name":"Fibo Edit [Rewrite Text]","created_by":"bria","source":"official","description":"Precisely rewrite text inside images while preserving typography, fonts, and layout.","status":"active","release_date":"2026-01-20","model_type":"image","page_url":"https://fal.run/bria/fibo-edit/rewrite_text","tagline":"Precise, reliable modification of existing text inside 
images.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-05-20","last_updated":"2026-06-03"},{"id":"bria/fibo-edit/sketch_to_colored_image","name":"Fibo Edit [Sketch to Image]","created_by":"bria","source":"official","description":"Convert line drawings and sketches into photorealistic, fully colored images with preserved structure.","status":"active","release_date":"2026-01-20","model_type":"image","page_url":"https://fal.run/bria/fibo-edit/sketch_to_colored_image","tagline":"Converts line drawings and sketches into photorealistic, fully colored images","capabilities":{"vision":true,"structured_output":true,"json_mode":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-05-20","last_updated":"2026-06-03"},{"id":"bria/fibo/generate/structured_prompt","name":"Fibo","created_by":"bria","source":"official","description":"Structured Prompt Generation endpoint for Fibo, Bria's SOTA Open source model.","status":"active","release_date":"2025-10-29","model_type":"other","page_url":"https://fal.run/bria/fibo/generate/structured_prompt","tagline":"Structured Prompt Generation endpoint for Fibo, Bria's SOTA Open source model","capabilities":{"structured_output":true,"json_mode":true},"last_seen_at":"2026-05-20","last_updated":"2026-06-03"},{"id":"bria/fibo/generate","name":"Fibo","created_by":"bria","source":"official","description":"SOTA open-source text-to-image model delivering high-fidelity outputs with accurate typography.","status":"active","release_date":"2025-10-29","model_type":"image","page_url":"https://fal.run/bria/fibo/generate","tagline":"SOTA Open source model trained on licensed data, transforming intent into structured control for precise, high-quality AI image generation in enterprise and agentic 
workflows.","capabilities":{"vision":true,"structured_output":true,"json_mode":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-05-20","last_updated":"2026-06-03"},{"id":"bria/fibo-lite/generate/structured_prompt/lite","name":"Fibo Lite","created_by":"bria","source":"official","description":"Structured Prompt Generation endpoint for Fibo-Lite, Bria's SOTA Open source model","status":"active","release_date":"2026-01-19","model_type":"other","page_url":"https://fal.run/bria/fibo-lite/generate/structured_prompt/lite","tagline":"Structured Prompt Generation endpoint for Fibo-Lite, Bria's SOTA Open source model","capabilities":{"structured_output":true,"json_mode":true},"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"bria/fibo-lite/generate/structured_prompt","name":"Fibo Lite","created_by":"bria","source":"official","description":"Convert plain text into Fibo-Lite's transparent JSON-structured prompts - Bria's unique controllability layer that no closed model offers.","status":"active","release_date":"2026-01-19","model_type":"other","page_url":"https://fal.run/bria/fibo-lite/generate/structured_prompt","tagline":"Structured Prompt Generation endpoint for Fibo-Lite, Bria's SOTA Open source model","capabilities":{"structured_output":true,"json_mode":true},"last_seen_at":"2026-05-20","last_updated":"2026-06-03"},{"id":"bria/fibo-lite/generate","name":"Fibo Lite","created_by":"bria","source":"official","description":"Fast, low-latency text-to-image model with high-quality output and full JSON-structured controllability.","status":"active","release_date":"2025-12-16","model_type":"image","page_url":"https://fal.run/bria/fibo-lite/generate","tagline":"Fibo Lite, the new addition to the Fibo model family, allows generating high-quality images with the same controllability of the JSON structured prompt with significantly improved 
latency.","capabilities":{"vision":true,"structured_output":true,"json_mode":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-05-20","last_updated":"2026-06-03"},{"id":"bria/genfill/v2","name":"Genfill","created_by":"bria","source":"official","description":"The GenFill Route enables the generation of objects by prompt in a specific region of an image.","status":"active","release_date":"2026-06-08","model_type":"image","page_url":"https://fal.run/bria/genfill/v2","tagline":"The GenFill Route enables the generation of objects by prompt in a specific region of an image.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-10","last_updated":"2026-06-18"},{"id":"bria/reimagine/3.2","name":"Reimagine","created_by":"bria","source":"official","description":"Reimagine uses a structure reference for generating new images while preserving the structure of an input image, guided by text prompts.","status":"active","release_date":"2025-08-20","model_type":"image","page_url":"https://fal.run/bria/reimagine/3.2","tagline":"Reimagine uses a structure reference for generating new images while preserving the structure of an input image, guided by text prompts.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"bria/replace-background","name":"Replace Background","created_by":"bria","source":"official","description":"Generate professional, eCommerce-ready product shots by replacing backgrounds with realistic lighting and accurate perspective from a simple text prompt.","status":"active","release_date":"2026-01-27","model_type":"image","page_url":"https://fal.run/bria/replace-background","tagline":"Creates enriched product shots by placing them in various environments using textual 
descriptions.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-05-20","last_updated":"2026-06-03"},{"id":"bria/text-to-image/3.2","name":"Bria 3.2 Text-to-Image","created_by":"bria","source":"official","description":"Bria’s Text-to-Image model, trained exclusively on licensed data for safe and risk-free commercial use.","status":"active","release_date":"2025-06-17","model_type":"image","page_url":"https://fal.run/bria/text-to-image/3.2","tagline":"Bria’s Text-to-Image model, trained exclusively on licensed data for safe and risk-free commercial use.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"bria/upscale/creative","name":"Upscale","created_by":"bria","source":"official","description":"Professional-grade creative upscaler that doubles resolution up to 10MP, regenerating sharper textures, refined details, and cleaner faces.","status":"active","release_date":"2026-02-23","model_type":"image","page_url":"https://fal.run/bria/upscale/creative","tagline":"Regenerate the image with sharper textures and richer details while doubling resolution, up to 10 megapixels output.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-05-20","last_updated":"2026-06-03"},{"id":"bria/video/background-removal/realtime","name":"Bria's VRMBG 3.0 Realtime","created_by":"bria","source":"official","description":"Remove video backgrounds in real time with Bria’s VRMBG 3.0 model.","status":"active","release_date":"2026-06-09","model_type":"other","page_url":"https://fal.run/bria/video/background-removal/realtime","tagline":"Remove video backgrounds in real time with Bria’s VRMBG 3.0 model.","last_seen_at":"2026-06-14","last_updated":"2026-06-18"},{"id":"bria/video/background-removal/v3","name":"Bria's 
VRMBG 3.0","created_by":"bria","source":"official","description":"Remove backgrounds from any video with Bria's VRMBG 3.0.","status":"active","release_date":"2026-06-08","model_type":"other","page_url":"https://fal.run/bria/video/background-removal/v3","tagline":"Remove backgrounds from any video with Bria's VRMBG 3.0.","last_seen_at":"2026-06-14","last_updated":"2026-06-18"},{"id":"bria/video/background-removal","name":"Video","created_by":"bria","source":"official","description":"Automatically remove backgrounds from videos -perfect for creating clean, professional content without a green screen.","status":"active","release_date":"2025-06-30","model_type":"other","page_url":"https://fal.run/bria/video/background-removal","tagline":"Automatically remove backgrounds from videos -perfect for creating clean, professional content without a green screen.","last_seen_at":"2026-06-14","last_updated":"2026-06-18"},{"id":"bria/video/erase/keypoints","name":"Video","created_by":"bria","source":"official","description":"High-fidelity keypoint-driven video object removal - minimal input, strong temporal consistency.","status":"active","release_date":"2025-12-23","model_type":"other","page_url":"https://fal.run/bria/video/erase/keypoints","tagline":"A high-fidelity capability for erasing unwanted objects, people, or visual elements from videos while maintaining aesthetic quality and temporal consistency.","last_seen_at":"2026-05-20","last_updated":"2026-06-03"},{"id":"bria/video/erase/mask","name":"Video","created_by":"bria","source":"official","description":"High-fidelity mask-based video object removal with strong temporal consistency.","status":"active","release_date":"2025-12-23","model_type":"other","page_url":"https://fal.run/bria/video/erase/mask","tagline":"A high-fidelity capability for erasing unwanted objects, people, or visual elements from videos while maintaining aesthetic quality and temporal 
consistency.","last_seen_at":"2026-05-20","last_updated":"2026-06-03"},{"id":"bria/video/erase/prompt","name":"Video","created_by":"bria","source":"official","description":"Erase unwanted objects, people, or elements from video with a text prompt.","status":"active","release_date":"2025-12-23","model_type":"other","page_url":"https://fal.run/bria/video/erase/prompt","tagline":"A high-fidelity capability for erasing unwanted objects, people, or visual elements from videos while maintaining aesthetic quality and temporal consistency","last_seen_at":"2026-05-20","last_updated":"2026-06-03"},{"id":"bria/video/increase-resolution","name":"Video","created_by":"bria","source":"official","description":"Professional-grade video upscaler with strong temporal consistency, enhancing videos up to 8K resolution.","status":"active","release_date":"2025-08-26","model_type":"other","page_url":"https://fal.run/bria/video/increase-resolution","tagline":"Upscale videos up to 8K output resolution.","last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"bytedance/lynx","name":"Lynx","created_by":"bytedance","source":"official","description":"Generate subject consistent videos using Lynx from ByteDance!","status":"active","release_date":"2025-11-18","model_type":"video","page_url":"https://fal.run/bytedance/lynx","tagline":"Generate subject consistent videos using Lynx from ByteDance!","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"bytedance/seed-audio-1.0","name":"Seed Audio 1.0","created_by":"bytedance","source":"official","description":"Seed Audio 1.0 is a new audio model from Bytedance that can generate high-quality, natural sounding audio using text, reference audios or an image.","status":"active","release_date":"2026-06-25","model_type":"other","page_url":"https://fal.run/bytedance/seed-audio-1.0","tagline":"Seed Audio 1.0 is a new audio model 
from Bytedance that can generate high-quality, natural sounding audio using text, reference audios or an image.","capabilities":{"vision":true},"last_seen_at":"2026-06-26","last_updated":"2026-06-29"},{"id":"bytedance/seedance-2.0/fast/image-to-video","name":"Seedance 2.0 Fast Image to Video","created_by":"bytedance","source":"official","description":"ByteDance's most advanced image-to-video model, fast tier.","status":"active","release_date":"2026-04-01","model_type":"video","page_url":"https://fal.run/bytedance/seedance-2.0/fast/image-to-video","tagline":"ByteDance's most advanced image-to-video model, fast tier.","capabilities":{"vision":true},"modalities":{"input":["text","image","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-22","last_updated":"2026-05-11"},{"id":"bytedance/seedance-2.0/fast/reference-to-video","name":"Seedance 2.0 Fast Reference to Video","created_by":"bytedance","source":"official","description":"ByteDance's most advanced reference-to-video model, fast tier.","status":"active","release_date":"2026-04-01","model_type":"video","page_url":"https://fal.run/bytedance/seedance-2.0/fast/reference-to-video","tagline":"ByteDance's most advanced reference-to-video model, fast tier.","capabilities":{"vision":true},"modalities":{"input":["text","image","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-05-29","last_updated":"2026-06-03"},{"id":"bytedance/seedance-2.0/fast/text-to-video","name":"Seedance 2.0 Fast Text to Video","created_by":"bytedance","source":"official","description":"ByteDance's most advanced text-to-video model, fast tier.","status":"active","release_date":"2026-04-01","model_type":"video","page_url":"https://fal.run/bytedance/seedance-2.0/fast/text-to-video","tagline":"ByteDance's most advanced text-to-video model, fast 
tier.","modalities":{"input":["text","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-05-29","last_updated":"2026-06-03"},{"id":"bytedance/seedance-2.0/image-to-video","name":"Seedance 2 Image to Video","created_by":"bytedance","source":"official","description":"ByteDance's most advanced image-to-video model.","status":"active","release_date":"2026-04-01","model_type":"video","page_url":"https://fal.run/bytedance/seedance-2.0/image-to-video","tagline":"ByteDance's most advanced image-to-video model.","capabilities":{"vision":true},"modalities":{"input":["text","image","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"bytedance/seedance-2.0/mini/image-to-video","name":"Seedance 2.0 Mini Image to Video","created_by":"bytedance","source":"official","description":"Seedance 2.0 Mini is a faster version of Seedance 2.0 that brings great performance and high generation speed at a lower cost.","status":"active","release_date":"2026-06-23","model_type":"video","page_url":"https://fal.run/bytedance/seedance-2.0/mini/image-to-video","tagline":"Seedance 2.0 Mini is a faster version of Seedance 2.0 that brings great performance and high generation speed at a lower cost.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"bytedance/seedance-2.0/mini/reference-to-video","name":"Seedance 2.0 Mini","created_by":"bytedance","source":"official","description":"Seedance 2.0 Mini is a faster version of Seedance 2.0 that brings great performance and high generation speed at a lower cost.","status":"active","release_date":"2026-06-23","model_type":"video","page_url":"https://fal.run/bytedance/seedance-2.0/mini/reference-to-video","tagline":"Seedance 2.0 Mini is a faster version of Seedance 2.0 that brings great performance and high generation speed at a lower 
cost.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"bytedance/seedance-2.0/mini/text-to-video","name":"Seedance 2.0 Mini Text to Video","created_by":"bytedance","source":"official","description":"Seedance 2.0 Mini is a faster version of Seedance 2.0 that brings great performance and high generation speed at a lower cost.","status":"active","release_date":"2026-06-23","model_type":"video","page_url":"https://fal.run/bytedance/seedance-2.0/mini/text-to-video","tagline":"Seedance 2.0 Mini is a faster version of Seedance 2.0 that brings great performance and high generation speed at a lower cost.","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"bytedance/seedance-2.0/reference-to-video","name":"Seedance 2 Reference to Video","created_by":"bytedance","source":"official","description":"ByteDance's most advanced reference-to-video model.","status":"active","release_date":"2026-04-01","model_type":"video","page_url":"https://fal.run/bytedance/seedance-2.0/reference-to-video","tagline":"ByteDance's most advanced reference-to-video model.","capabilities":{"vision":true},"modalities":{"input":["text","image","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"bytedance/seedance-2.0/text-to-video","name":"Seedance 2.0 Text to Video API","created_by":"bytedance","source":"official","description":"ByteDance's most advanced text-to-video model.","status":"active","release_date":"2026-04-01","model_type":"video","page_url":"https://fal.run/bytedance/seedance-2.0/text-to-video","tagline":"ByteDance's most advanced text-to-video 
model.","modalities":{"input":["text","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-23","last_updated":"2026-06-29"},{"id":"cassetteai/music-generator","name":"music generator","created_by":"cassetteai","source":"official","description":"CassetteAI’s model generates a 30-second sample in under 2 seconds and a full 3-minute track in under 10 seconds.","status":"active","release_date":"2025-03-27","model_type":"other","page_url":"https://fal.run/CassetteAI/music-generator","tagline":"CassetteAI’s model generates a 30-second sample in under 2 seconds and a full 3-minute track in under 10 seconds.","last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"cassetteai/sound-effects-generator","name":"Sound Effects Generator","created_by":"cassetteai","source":"official","description":"Create stunningly realistic sound effects in seconds - CassetteAI's Sound Effects Model generates high-quality SFX up to 30 seconds long in just 1 second of processing time","status":"active","release_date":"2025-04-03","model_type":"other","page_url":"https://fal.run/cassetteai/sound-effects-generator","tagline":"Create stunningly realistic sound effects in seconds - CassetteAI's Sound Effects Model generates high-quality SFX up to 30 seconds long in just 1 second of processing time","last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"cassetteai/video-sound-effects-generator","name":"Video Sound Effects Generator","created_by":"cassetteai","source":"official","description":"Add sound effects to your videos","status":"active","release_date":"2025-04-07","model_type":"other","page_url":"https://fal.run/cassetteai/video-sound-effects-generator","tagline":"Add sound effects to your videos","last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"clarityai/crystal-upscaler","name":"Crystal Upscaler","created_by":"clarityai","source":"official","description":"An advanced image enhancement tool designed specifically for facial details and 
portrait photography, utilizing Clarity AI's upscaling technology.","status":"active","release_date":"2025-11-25","model_type":"image","page_url":"https://fal.run/clarityai/crystal-upscaler","tagline":"An advanced image enhancement tool designed specifically for facial details and portrait photography, utilizing Clarity AI's upscaling technology.","capabilities":{"vision":true,"tool_call":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"tools":["function_calling"],"last_seen_at":"2026-05-06","last_updated":"2026-05-11"},{"id":"clarityai/crystal-video-upscaler","name":"Crystal Upscaler [Video]","created_by":"clarityai","source":"official","description":"Do high precision video upscaling that respects the original video perfectly using Crystal Upscaler's new video upscaling method!","status":"active","release_date":"2025-12-17","model_type":"other","page_url":"https://fal.run/clarityai/crystal-video-upscaler","tagline":"Do high precision video upscaling that respects the original video perfectly using Crystal Upscaler's new video upscaling method!","last_seen_at":"2026-05-06","last_updated":"2026-05-11"},{"id":"decart/lucy-edit/pro","name":"Lucy Edit [Pro]","created_by":"decart","source":"official","description":"Edit outfits, objects, faces, or restyle your video - all with maximum detail retention.","status":"active","release_date":"2025-09-18","model_type":"other","page_url":"https://fal.run/decart/lucy-edit/pro","tagline":"Edit outfits, objects, faces, or restyle your video - all with maximum detail retention.","last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"decart/lucy-restyle","name":"Lucy Restyle","created_by":"decart","source":"official","description":"Restyle videos up to 30 min long - maintaining maximum detail quality.","status":"active","release_date":"2025-12-18","model_type":"other","page_url":"https://fal.run/decart/lucy-restyle","tagline":"Restyle videos up to 30 min long - maintaining maximum 
detail quality.","last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"decart/lucy2-vton/realtime","name":"Lucy 2.1 VTON Realtime","created_by":"decart","source":"official","description":"Realtime Try On experience with Decart Lucy 2.1 VTON","status":"active","release_date":"2026-04-29","model_type":"other","page_url":"https://fal.run/decart/lucy2-vton/realtime","tagline":"Realtime Try On experience with Decart Lucy 2.1 VTON","last_seen_at":"2026-05-07","last_updated":"2026-05-11"},{"id":"fal-ai/ace-step/audio-inpaint","name":"ACE Step Audio Inpaint","created_by":"fal","source":"official","description":"Modify a portion of provided audio with lyrics and/or style using ACE-Step","status":"active","release_date":"2025-05-11","model_type":"other","page_url":"https://fal.run/fal-ai/ace-step/audio-inpaint","tagline":"Modify a portion of provided audio with lyrics and/or style using ACE-Step","last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/ace-step/audio-outpaint","name":"ACE Step Audio Outpaint","created_by":"fal","source":"official","description":"Extend the beginning or end of provided audio with lyrics and/or style using ACE-Step","status":"active","release_date":"2025-05-11","model_type":"other","page_url":"https://fal.run/fal-ai/ace-step/audio-outpaint","tagline":"Extend the beginning or end of provided audio with lyrics and/or style using ACE-Step","last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/ace-step/audio-to-audio","name":"ACE Step Audio To Audio","created_by":"fal","source":"official","description":"Generate music from a lyrics and example audio using ACE-Step","status":"active","release_date":"2025-05-11","model_type":"other","page_url":"https://fal.run/fal-ai/ace-step/audio-to-audio","tagline":"Generate music from a lyrics and example audio using ACE-Step","last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/ace-step/prompt-to-audio","name":"ACE Step Prompt To 
Audio","created_by":"fal","source":"official","description":"Generate music from a simple prompt using ACE-Step","status":"active","release_date":"2025-05-11","model_type":"other","page_url":"https://fal.run/fal-ai/ace-step/prompt-to-audio","tagline":"Generate music from a simple prompt using ACE-Step","last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/ace-step","name":"ACE Step","created_by":"fal","source":"official","description":"Generate music with lyrics from text using ACE-Step","status":"active","release_date":"2025-05-08","model_type":"other","page_url":"https://fal.run/fal-ai/ace-step","tagline":"Generate music with lyrics from text using ACE-Step","last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/ai-avatar/multi-text","name":"AI Avatar Multi Text","created_by":"fal","source":"official","description":"MultiTalk model generates a multi-person conversation video from an image and text inputs.","status":"active","release_date":"2025-06-23","model_type":"video","page_url":"https://fal.run/fal-ai/ai-avatar/multi-text","tagline":"MultiTalk model generates a multi-person conversation video from an image and text inputs.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/ai-avatar/multi","name":"AI Avatar Multi","created_by":"fal","source":"official","description":"MultiTalk model generates a multi-person conversation video from an image and audio files.","status":"active","release_date":"2025-06-23","model_type":"video","page_url":"https://fal.run/fal-ai/ai-avatar/multi","tagline":"MultiTalk model generates a multi-person conversation video from an image and audio files.","capabilities":{"vision":true},"modalities":{"input":["text","image","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/ai-avatar/single-text","name":"AI 
Avatar Single Text","created_by":"fal","source":"official","description":"MultiTalk model generates a talking avatar video from an image and text.","status":"active","release_date":"2025-06-23","model_type":"video","page_url":"https://fal.run/fal-ai/ai-avatar/single-text","tagline":"MultiTalk model generates a talking avatar video from an image and text.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/ai-avatar","name":"Ai Avatar","created_by":"fal","source":"official","description":"MultiTalk model generates a talking avatar video from an image and audio file.","status":"active","release_date":"2025-06-23","model_type":"video","page_url":"https://fal.run/fal-ai/ai-avatar","tagline":"MultiTalk model generates a talking avatar video from an image and audio file.","capabilities":{"vision":true},"modalities":{"input":["text","image","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/amt-interpolation/frame-interpolation","name":"AMT Frame Interpolation","created_by":"fal","source":"official","description":"Interpolate between image frames","status":"active","release_date":"2024-07-18","model_type":"video","page_url":"https://fal.run/fal-ai/amt-interpolation/frame-interpolation","tagline":"Interpolate between image frames","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/amt-interpolation","name":"AMT Interpolation","created_by":"fal","source":"official","description":"Interpolate between video frames","status":"active","release_date":"2024-02-21","model_type":"other","page_url":"https://fal.run/fal-ai/amt-interpolation","tagline":"Interpolate between video 
frames","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/animatediff-sparsectrl-lcm","name":"Animatediff SparseCtrl LCM","created_by":"fal","source":"official","description":"Animate Your Drawings with Latent Consistency Models!","status":"active","release_date":"2023-11-09","model_type":"video","page_url":"https://fal.run/fal-ai/animatediff-sparsectrl-lcm","tagline":"Animate Your Drawings with Latent Consistency Models!","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/arbiter/image/image","name":"Arbiter","created_by":"fal","source":"official","description":"Image reference comparison measurements","status":"active","release_date":"2025-12-26","model_type":"other","page_url":"https://fal.run/fal-ai/arbiter/image/image","tagline":"Image reference comparison measurements","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/arbiter/image/text","name":"Arbiter","created_by":"fal","source":"official","description":"Semantic image alignment measurements","status":"active","release_date":"2025-12-26","model_type":"other","page_url":"https://fal.run/fal-ai/arbiter/image/text","tagline":"Semantic image alignment measurements","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/arbiter/image","name":"Arbiter","created_by":"fal","source":"official","description":"Reference-free image measurements","status":"active","release_date":"2025-12-26","model_type":"other","page_url":"https://fal.run/fal-ai/arbiter/image","tagline":"Reference-free image measurements","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/audio-understanding","name":"Audio Understanding","created_by":"fal","source":"official","description":"A audio understanding model to analyze audio content and answer questions about what's happening in the 
audio based on user prompts.","status":"active","release_date":"2025-10-24","model_type":"other","page_url":"https://fal.run/fal-ai/audio-understanding","tagline":"A audio understanding model to analyze audio content and answer questions about what's happening in the audio based on user prompts.","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/aura-flow","name":"AuraFlow","created_by":"fal","source":"official","description":"AuraFlow v0.3 is an open-source flow-based text-to-image generation model that achieves state-of-the-art results on GenEval.","status":"active","release_date":"2024-12-02","model_type":"image","page_url":"https://fal.run/fal-ai/aura-flow","tagline":"AuraFlow v0.3 is an open-source flow-based text-to-image generation model that achieves state-of-the-art results on GenEval.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-05-05","last_updated":"2026-05-11"},{"id":"fal-ai/aura-sr","name":"AuraSR","created_by":"fal","source":"official","description":"Upscale your images with AuraSR.","status":"active","release_date":"2024-04-11","model_type":"image","page_url":"https://fal.run/fal-ai/aura-sr","tagline":"Upscale your images with AuraSR.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-05-05","last_updated":"2026-05-11"},{"id":"fal-ai/auto-caption","name":"Auto-Captioner","created_by":"fal","source":"official","description":"Automatically generates text captions for your videos from the audio as per text colour/font specifications","status":"active","release_date":"2025-01-03","model_type":"other","page_url":"https://fal.run/fal-ai/auto-caption","tagline":"Automatically generates text captions for your videos from the audio as per text colour/font 
specifications","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/bagel/edit","name":"Bagel","created_by":"fal","source":"official","description":"Bagel is a 7B parameter multimodal model from Bytedance-Seed that can generate both images and text.","status":"active","release_date":"2025-05-21","model_type":"image","page_url":"https://fal.run/fal-ai/bagel/edit","tagline":"Bagel is a 7B parameter multimodal model from Bytedance-Seed that can generate both images and text.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/bagel/understand","name":"Bagel","created_by":"fal","source":"official","description":"Bagel is a 7B parameter multimodal model from Bytedance-Seed that can generate both text and images.","status":"active","release_date":"2025-05-21","model_type":"other","page_url":"https://fal.run/fal-ai/bagel/understand","tagline":"Bagel is a 7B parameter multimodal model from Bytedance-Seed that can generate both text and images.","capabilities":{"vision":true,"structured_output":true,"json_mode":true},"last_seen_at":"2026-04-27","last_updated":"2026-05-11"},{"id":"fal-ai/bagel","name":"Bagel","created_by":"fal","source":"official","description":"Bagel is a 7B parameter from Bytedance-Seed multimodal model that can generate both text and images.","status":"active","release_date":"2025-05-21","model_type":"image","page_url":"https://fal.run/fal-ai/bagel","tagline":"Bagel is a 7B parameter from Bytedance-Seed multimodal model that can generate both text and images.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/ben/v2/image","name":"ben-v2-image","created_by":"fal","source":"official","description":"A fast and high quality model for image background 
removal.","status":"active","release_date":"2025-02-11","model_type":"image","page_url":"https://fal.run/fal-ai/ben/v2/image","tagline":"A fast and high quality model for image background removal.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/ben/v2/video","name":"Ben-Video-Bg-Rm","created_by":"fal","source":"official","description":"A model for high quality and smooth background removal for videos.","status":"active","release_date":"2025-02-11","model_type":"other","page_url":"https://fal.run/fal-ai/ben/v2/video","tagline":"A model for high quality and smooth background removal for videos.","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/bernini-r/edit-image","name":"Bernini-R Edit Image","created_by":"fal","source":"official","description":"Edit any image with a natural-language instruction using Bernini-R, changing the weather, materials, objects, or style while preserving the original composition.","status":"active","release_date":"2026-06-08","model_type":"image","page_url":"https://fal.run/fal-ai/bernini-r/edit-image","tagline":"Edit any image with a natural-language instruction using Bernini-R, changing the weather, materials, objects, or style while preserving the original composition.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-09","last_updated":"2026-06-10"},{"id":"fal-ai/bernini-r/edit-video","name":"Bernini-R Edit Video","created_by":"fal","source":"official","description":"Edit any video with a natural-language instruction using Bernini-R, changing objects, weather, background, or camera angle while keeping the rest of the scene intact.","status":"active","release_date":"2026-06-08","model_type":"other","page_url":"https://fal.run/fal-ai/bernini-r/edit-video","tagline":"Edit any video with a 
natural-language instruction using Bernini-R, changing objects, weather, background, or camera angle while keeping the rest of the scene intact.","last_seen_at":"2026-06-09","last_updated":"2026-06-10"},{"id":"fal-ai/bernini-r/reference-edit-video","name":"Bernini-R Reference Edit Video","created_by":"fal","source":"official","description":"Edit a video guided by reference images with Bernini-R, bringing an object, material, background, style, or weather from a reference image into your video.","status":"active","release_date":"2026-06-08","model_type":"other","page_url":"https://fal.run/fal-ai/bernini-r/reference-edit-video","tagline":"Edit a video guided by reference images with Bernini-R, bringing an object, material, background, style, or weather from a reference image into your video.","capabilities":{"vision":true},"last_seen_at":"2026-06-09","last_updated":"2026-06-10"},{"id":"fal-ai/bernini-r/reference-to-video","name":"Bernini-R Reference to Video","created_by":"fal","source":"official","description":"Turn up to five reference images into one continuous, consistent video with Bernini-R, with smooth, stable camera motion and no scene cuts.","status":"active","release_date":"2026-06-08","model_type":"video","page_url":"https://fal.run/fal-ai/bernini-r/reference-to-video","tagline":"Turn up to five reference images into one continuous, consistent video with Bernini-R, with smooth, stable camera motion and no scene cuts.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-09","last_updated":"2026-06-10"},{"id":"fal-ai/bernini-r/text-to-video","name":"Bernini-R Text to Video","created_by":"fal","source":"official","description":"Generate high-quality video from a text prompt with Bernini-R, ByteDance's unified video generation and editing 
model.","status":"active","release_date":"2026-06-08","model_type":"video","page_url":"https://fal.run/fal-ai/bernini-r/text-to-video","tagline":"Generate high-quality video from a text prompt with Bernini-R, ByteDance's unified video generation and editing model.","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-09","last_updated":"2026-06-10"},{"id":"fal-ai/birefnet/v2/video","name":"Birefnet","created_by":"fal","source":"official","description":"Video background removal version of bilateral reference framework (BiRefNet) for high-resolution dichotomous image segmentation (DIS)\n","status":"active","release_date":"2025-10-26","model_type":"other","page_url":"https://fal.run/fal-ai/birefnet/v2/video","tagline":"Video background removal version of bilateral reference framework (BiRefNet) for high-resolution dichotomous image segmentation (DIS)\n","capabilities":{"vision":true},"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/birefnet/v2","name":"Birefnet Background Removal V2","created_by":"fal","source":"official","description":"bilateral reference framework (BiRefNet) for high-resolution dichotomous image segmentation (DIS)","status":"active","release_date":"2024-10-28","model_type":"image","page_url":"https://fal.run/fal-ai/birefnet/v2","tagline":"bilateral reference framework (BiRefNet) for high-resolution dichotomous image segmentation (DIS)","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-05-13","last_updated":"2026-06-03"},{"id":"fal-ai/birefnet","name":"Birefnet Background Removal","created_by":"fal","source":"official","description":"bilateral reference framework (BiRefNet) for high-resolution dichotomous image segmentation (DIS)","status":"active","release_date":"2024-02-27","model_type":"image","page_url":"https://fal.run/fal-ai/birefnet","tagline":"bilateral reference framework (BiRefNet) for 
high-resolution dichotomous image segmentation (DIS)","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-05-13","last_updated":"2026-06-03"},{"id":"fal-ai/bitdance","name":"Bitdance","created_by":"fal","source":"official","description":"Image generation with BitDance.","status":"active","release_date":"2026-02-21","model_type":"image","page_url":"https://fal.run/fal-ai/bitdance","tagline":"Image generation with BitDance.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-02-21","last_updated":"2026-05-11"},{"id":"fal-ai/boogu-image/edit","name":"Boogu Image","created_by":"fal","source":"official","description":"Image To Image Model using Boogu-Image","status":"active","release_date":"2026-06-18","model_type":"image","page_url":"https://fal.run/fal-ai/boogu-image/edit","tagline":"Image To Image Model using Boogu-Image","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-18","last_updated":"2026-06-18"},{"id":"fal-ai/boogu-image","name":"Boogu Image","created_by":"fal","source":"official","description":"Text To Image Model using Boogu-Image","status":"active","release_date":"2026-06-18","model_type":"image","page_url":"https://fal.run/fal-ai/boogu-image","tagline":"Text To Image Model using Boogu-Image","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-18","last_updated":"2026-06-18"},{"id":"fal-ai/bria/background/remove","name":"Bria RMBG 2.0","created_by":"fal","source":"official","description":"Bria RMBG 2.0 enables seamless removal of backgrounds from images, ideal for professional editing tasks.","status":"active","release_date":"2024-12-19","model_type":"image","page_url":"https://fal.run/fal-ai/bria/background/remove","tagline":"Bria RMBG 2.0 
enables seamless removal of backgrounds from images, ideal for professional editing tasks.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/bria/background/replace","name":"Bria Background Replace","created_by":"fal","source":"official","description":"Bria Background Replace allows for efficient swapping of backgrounds in images via text prompts or reference image, delivering realistic and polished results.","status":"active","release_date":"2024-12-19","model_type":"image","page_url":"https://fal.run/fal-ai/bria/background/replace","tagline":"Bria Background Replace allows for efficient swapping of backgrounds in images via text prompts or reference image, delivering realistic and polished results.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/bria/eraser","name":"Bria Eraser","created_by":"fal","source":"official","description":"Bria Eraser enables precise removal of unwanted objects from images while maintaining high-quality outputs.","status":"active","release_date":"2024-12-19","model_type":"image","page_url":"https://fal.run/fal-ai/bria/eraser","tagline":"Bria Eraser enables precise removal of unwanted objects from images while maintaining high-quality outputs.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/bria/expand","name":"Bria Expand Image","created_by":"fal","source":"official","description":"Bria Expand expands images beyond their borders in high quality.","status":"active","release_date":"2024-12-19","model_type":"image","page_url":"https://fal.run/fal-ai/bria/expand","tagline":"Bria Expand expands images beyond their borders in high 
quality.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/bria/genfill","name":"Bria GenFill","created_by":"fal","source":"official","description":"Bria GenFill enables high-quality object addition or visual transformation.","status":"active","release_date":"2024-12-19","model_type":"image","page_url":"https://fal.run/fal-ai/bria/genfill","tagline":"Bria GenFill enables high-quality object addition or visual transformation.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/bria/product-shot","name":"Bria Product Shot","created_by":"fal","source":"official","description":"Place any product in any scenery with just a prompt or reference image while maintaining high integrity of the product.","status":"active","release_date":"2024-12-19","model_type":"image","page_url":"https://fal.run/fal-ai/bria/product-shot","tagline":"Place any product in any scenery with just a prompt or reference image while maintaining high integrity of the product.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/bria/reimagine","name":"Bria","created_by":"fal","source":"official","description":"Structure Reference allows generating new images while preserving the structure of an input image, guided by text prompts.","status":"active","release_date":"2025-07-08","model_type":"image","page_url":"https://fal.run/fal-ai/bria/reimagine","tagline":"Structure Reference allows generating new images while preserving the structure of an input image, guided by text 
prompts.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/bria/text-to-image/base","name":"Bria Text-to-Image Base","created_by":"fal","source":"official","description":"Bria's Text-to-Image model, trained exclusively on licensed data for safe and risk-free commercial use.","status":"active","release_date":"2024-12-19","model_type":"image","page_url":"https://fal.run/fal-ai/bria/text-to-image/base","tagline":"Bria's Text-to-Image model, trained exclusively on licensed data for safe and risk-free commercial use.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/bria/text-to-image/fast","name":"Bria Text-to-Image Fast","created_by":"fal","source":"official","description":"Bria's Text-to-Image model with perfect harmony of latency and quality.","status":"active","release_date":"2024-12-19","model_type":"image","page_url":"https://fal.run/fal-ai/bria/text-to-image/fast","tagline":"Bria's Text-to-Image model with perfect harmony of latency and quality.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/bria/text-to-image/hd","name":"Bria Text-to-Image HD","created_by":"fal","source":"official","description":"Bria's Text-to-Image model for HD images.","status":"active","release_date":"2024-12-19","model_type":"image","page_url":"https://fal.run/fal-ai/bria/text-to-image/hd","tagline":"Bria's Text-to-Image model for HD images.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/bytedance/dreamactor/v2","name":"Bytedance Dreamactor 
V2","created_by":"fal","source":"official","description":"Transfer motion from a video to characters in an image using Dreamactor v2.","status":"active","release_date":"2026-02-06","model_type":"other","page_url":"https://fal.run/fal-ai/bytedance/dreamactor/v2","tagline":"Transfer motion from a video to characters in an image using Dreamactor v2.","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/bytedance/dreamina/v3.1/text-to-image","name":"Bytedance Dreamina V3.1 Text To Image","created_by":"fal","source":"official","description":"Dreamina showcases superior picture effects, with significant improvements in picture aesthetics, precise and diverse styles, and rich details.","status":"active","release_date":"2025-08-06","model_type":"image","page_url":"https://fal.run/fal-ai/bytedance/dreamina/v3.1/text-to-image","tagline":"Dreamina showcases superior picture effects, with significant improvements in picture aesthetics, precise and diverse styles, and rich details.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/bytedance/omnihuman/v1.5","name":"Bytedance Omnihuman V1.5","created_by":"fal","source":"official","description":"Omnihuman v1.5 is a new and improved version of Omnihuman.","status":"active","release_date":"2025-09-23","model_type":"video","page_url":"https://fal.run/fal-ai/bytedance/omnihuman/v1.5","tagline":"Omnihuman v1.5 is a new and improved version of Omnihuman.","capabilities":{"vision":true},"modalities":{"input":["text","image","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/bytedance/omnihuman","name":"OmniHuman","created_by":"fal","source":"official","description":"OmniHuman generates video using an image of a human figure paired with an audio 
file.","status":"active","release_date":"2025-07-27","model_type":"video","page_url":"https://fal.run/fal-ai/bytedance/omnihuman","tagline":"OmniHuman generates video using an image of a human figure paired with an audio file.","capabilities":{"vision":true},"modalities":{"input":["text","image","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/bytedance/seed-speech/tts/v2","name":"Bytedance Seed Speech Text to Speech","created_by":"fal","source":"official","description":"Seed Speech developed by ByteDance, is a family of large-scale text-to-speech models capable of synthesizing speech that is virtually indistinguishable from human speech.","status":"active","release_date":"2026-06-05","model_type":"tts","page_url":"https://fal.run/fal-ai/bytedance/seed-speech/tts/v2","tagline":"Seed Speech developed by ByteDance, is a family of large-scale text-to-speech models capable of synthesizing speech that is virtually indistinguishable from human speech.","modalities":{"input":["text"],"output":["audio"]},"endpoints":["audio_speech"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/bytedance/seed/v2/mini","name":"Bytedance Seed V2 Mini","created_by":"fal","source":"official","description":" Seed 2.0 Mini is a high-performance multimodal model optimized for low latency and high concurrency.","status":"active","release_date":"2026-03-17","model_type":"other","page_url":"https://fal.run/fal-ai/bytedance/seed/v2/mini","tagline":" Seed 2.0 Mini is a high-performance multimodal model optimized for low latency and high concurrency.","capabilities":{"vision":true,"reasoning":true},"last_seen_at":"2026-03-18","last_updated":"2026-06-03"},{"id":"fal-ai/bytedance/seedance/v1/lite/image-to-video","name":"Seedance 1.0 Lite","created_by":"fal","source":"official","description":"Seedance 1.0 
Lite","status":"active","release_date":"2025-06-13","model_type":"video","page_url":"https://fal.run/fal-ai/bytedance/seedance/v1/lite/image-to-video","tagline":"Seedance 1.0 Lite","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/bytedance/seedance/v1/lite/reference-to-video","name":"Bytedance","created_by":"fal","source":"official","description":"Seedance lite reference-to-video allows the use of 1 to 4 images as reference to create a high-quality video.","status":"active","release_date":"2025-09-01","model_type":"video","page_url":"https://fal.run/fal-ai/bytedance/seedance/v1/lite/reference-to-video","tagline":"Seedance lite reference-to-video allows the use of 1 to 4 images as reference to create a high-quality video.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/bytedance/seedance/v1/lite/text-to-video","name":"Seedance 1.0 Lite","created_by":"fal","source":"official","description":"Seedance 1.0 Lite","status":"active","release_date":"2025-06-13","model_type":"video","page_url":"https://fal.run/fal-ai/bytedance/seedance/v1/lite/text-to-video","tagline":"Seedance 1.0 Lite","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/bytedance/seedance/v1/pro/fast/image-to-video","name":"Bytedance Seedance V1 Pro Fast Image To Video","created_by":"fal","source":"official","description":"Image to Video endpoint for Seedance 1.0 Pro Fast, a next-generation video model designed to deliver maximum performance at minimal cost","status":"active","release_date":"2025-10-24","model_type":"video","page_url":"https://fal.run/fal-ai/bytedance/seedance/v1/pro/fast/image-to-video","tagline":"Image to Video endpoint for Seedance 
1.0 Pro Fast, a next-generation video model designed to deliver maximum performance at minimal cost","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/bytedance/seedance/v1/pro/fast/text-to-video","name":"Bytedance Seedance V1 Pro Fast Text To Video","created_by":"fal","source":"official","description":"Text to Video endpoint for Seedance 1.0 Pro Fast, a next-generation video model designed to deliver maximum performance at minimal cost","status":"active","release_date":"2025-10-24","model_type":"video","page_url":"https://fal.run/fal-ai/bytedance/seedance/v1/pro/fast/text-to-video","tagline":"Text to Video endpoint for Seedance 1.0 Pro Fast, a next-generation video model designed to deliver maximum performance at minimal cost","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/bytedance/seedance/v1/pro/image-to-video","name":"Seedance 1.0 Pro","created_by":"fal","source":"official","description":"Seedance 1.0 Pro, a high quality video generation model developed by Bytedance.","status":"active","release_date":"2025-06-16","model_type":"video","page_url":"https://fal.run/fal-ai/bytedance/seedance/v1/pro/image-to-video","tagline":"Seedance 1.0 Pro, a high quality video generation model developed by Bytedance.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/bytedance/seedance/v1/pro/text-to-video","name":"Seedance 1.0 Pro","created_by":"fal","source":"official","description":"Seedance 1.0 Pro, a high quality video generation model developed by 
Bytedance.","status":"active","release_date":"2025-06-16","model_type":"video","page_url":"https://fal.run/fal-ai/bytedance/seedance/v1/pro/text-to-video","tagline":"Seedance 1.0 Pro, a high quality video generation model developed by Bytedance.","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/bytedance/seedance/v1.5/pro/image-to-video","name":"Bytedance Seedance V1.5 Pro Image To Video","created_by":"fal","source":"official","description":"Generate videos with audio with Seedance 1.5 (supports start & end frame) ","status":"active","release_date":"2025-12-23","model_type":"video","page_url":"https://fal.run/fal-ai/bytedance/seedance/v1.5/pro/image-to-video","tagline":"Generate videos with audio with Seedance 1.5 (supports start & end frame) ","capabilities":{"vision":true},"modalities":{"input":["text","image","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/bytedance/seedance/v1.5/pro/text-to-video","name":"Bytedance Seedance V1.5 Pro Text To Video","created_by":"fal","source":"official","description":"Generate videos with audio with Seedance 1.5","status":"active","release_date":"2025-12-23","model_type":"video","page_url":"https://fal.run/fal-ai/bytedance/seedance/v1.5/pro/text-to-video","tagline":"Generate videos with audio with Seedance 1.5","modalities":{"input":["text","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/bytedance/seedream/v3/text-to-image","name":"Bytedance","created_by":"fal","source":"official","description":"Seedream 3.0 is a bilingual (Chinese and English) text-to-image model that excels at text-to-image generation.","status":"active","release_date":"2025-06-10","model_type":"image","page_url":"https://fal.run/fal-ai/bytedance/seedream/v3/text-to-image","tagline":"Seedream 3.0 is a bilingual (Chinese 
and English) text-to-image model that excels at text-to-image generation.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/bytedance/seedream/v4/edit","name":"Bytedance Seedream V4 Edit","created_by":"fal","source":"official","description":"A new-generation image creation model ByteDance, Seedream 4.0 integrates image generation and image editing capabilities into a single, unified architecture.","status":"active","release_date":"2025-09-09","model_type":"image","page_url":"https://fal.run/fal-ai/bytedance/seedream/v4/edit","tagline":"A new-generation image creation model ByteDance, Seedream 4.0 integrates image generation and image editing capabilities into a single, unified architecture.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-26","last_updated":"2026-06-03"},{"id":"fal-ai/bytedance/seedream/v4/text-to-image","name":"Bytedance Seedream V4 Text To Image","created_by":"fal","source":"official","description":"A new-generation image creation model ByteDance, Seedream 4.0 integrates image generation and image editing capabilities into a single, unified architecture.","status":"active","release_date":"2025-09-09","model_type":"image","page_url":"https://fal.run/fal-ai/bytedance/seedream/v4/text-to-image","tagline":"A new-generation image creation model ByteDance, Seedream 4.0 integrates image generation and image editing capabilities into a single, unified architecture.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/bytedance/seedream/v4.5/edit","name":"Bytedance Seedream V4.5 Edit","created_by":"fal","source":"official","description":"A new-generation image creation model ByteDance, Seedream 4.5 integrates image 
generation and image editing capabilities into a single, unified architecture.","status":"active","release_date":"2025-12-03","model_type":"image","page_url":"https://fal.run/fal-ai/bytedance/seedream/v4.5/edit","tagline":"A new-generation image creation model ByteDance, Seedream 4.5 integrates image generation and image editing capabilities into a single, unified architecture.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-26","last_updated":"2026-06-03"},{"id":"fal-ai/bytedance/seedream/v4.5/text-to-image","name":"Bytedance Seedream V4.5 Text To Image","created_by":"fal","source":"official","description":"A new-generation image creation model ByteDance, Seedream 4.5 integrates image generation and image editing capabilities into a single, unified architecture.","status":"active","release_date":"2025-12-03","model_type":"image","page_url":"https://fal.run/fal-ai/bytedance/seedream/v4.5/text-to-image","tagline":"A new-generation image creation model ByteDance, Seedream 4.5 integrates image generation and image editing capabilities into a single, unified architecture.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-26","last_updated":"2026-06-03"},{"id":"fal-ai/bytedance/seedream/v5/lite/edit","name":"Bytedance Seedream V5 Lite Edit","created_by":"fal","source":"official","description":"Image editing endpoint for the fast Lite version of Seedream 5.0, supporting high quality intelligent image editing with multiple inputs.","status":"active","release_date":"2026-02-23","model_type":"image","page_url":"https://fal.run/fal-ai/bytedance/seedream/v5/lite/edit","tagline":"Image editing endpoint for the fast Lite version of Seedream 5.0, supporting high quality intelligent image editing with multiple 
inputs.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-05-29","last_updated":"2026-06-03"},{"id":"fal-ai/bytedance/seedream/v5/lite/text-to-image","name":"Bytedance Seedream V5 Lite Text To Image","created_by":"fal","source":"official","description":"Text to Image endpoint for the fast Lite version of Seedream 5.0, supporting high quality intelligent text-to-image generation.","status":"active","release_date":"2026-02-23","model_type":"image","page_url":"https://fal.run/fal-ai/bytedance/seedream/v5/lite/text-to-image","tagline":"Text to Image endpoint for the fast Lite version of Seedream 5.0, supporting high quality intelligent text-to-image generation.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-05-27","last_updated":"2026-06-03"},{"id":"fal-ai/bytedance-upscaler/upscale/video","name":"Bytedance Upscaler Upscale Video","created_by":"fal","source":"official","description":"Upscale videos with Bytedance's video upscaler.","status":"active","release_date":"2025-10-31","model_type":"other","page_url":"https://fal.run/fal-ai/bytedance-upscaler/upscale/video","tagline":"Upscale videos with Bytedance's video upscaler.","last_seen_at":"2026-04-28","last_updated":"2026-06-03"},{"id":"fal-ai/bytedance/video-stylize","name":"Bytedance","created_by":"fal","source":"official","description":"Transform your images into stylized videos using this workflow.","status":"active","release_date":"2025-08-12","model_type":"video","page_url":"https://fal.run/fal-ai/bytedance/video-stylize","tagline":"Transform your images into stylized videos using this 
workflow.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/calligrapher","name":"Calligrapher","created_by":"fal","source":"official","description":"Use the text and font retaining capabilities of calligrapher to modify texts on your books, clothes and many more.","status":"active","release_date":"2025-07-12","model_type":"image","page_url":"https://fal.run/fal-ai/calligrapher","tagline":"Use the text and font retaining capabilities of calligrapher to modify texts on your books, clothes and many more.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/cartoonify","name":"Cartoonify","created_by":"fal","source":"official","description":"Transform images into 3D cartoon artwork using an AI model that applies cartoon stylization while preserving the original image's composition and details.","status":"active","release_date":"2025-04-14","model_type":"image","page_url":"https://fal.run/fal-ai/cartoonify","tagline":"Transform images into 3D cartoon artwork using an AI model that applies cartoon stylization while preserving the original image's composition and details.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/cat-vton","name":"try-on","created_by":"fal","source":"official","description":"Image based high quality Virtual Try-On","status":"active","release_date":"2024-12-17","model_type":"image","page_url":"https://fal.run/fal-ai/cat-vton","tagline":"Image based high quality Virtual 
Try-On","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/ccsr","name":"CCSR Upscaler","created_by":"fal","source":"official","description":"SOTA Image Upscaler","status":"active","release_date":"2024-05-05","model_type":"image","page_url":"https://fal.run/fal-ai/ccsr","tagline":"SOTA Image Upscaler","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/chain-of-zoom","name":"Chain Of Zoom","created_by":"fal","source":"official","description":"Extreme Super-Resolution via Scale Autoregression and Preference Alignment","status":"active","release_date":"2025-06-18","model_type":"image","page_url":"https://fal.run/fal-ai/chain-of-zoom","tagline":"Extreme Super-Resolution via Scale Autoregression and Preference Alignment","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/chatterbox/speech-to-speech","name":"Chatterbox","created_by":"fal","source":"official","description":"Whether you're working on memes, videos, games, or AI agents, Chatterbox brings your content to life.","status":"active","release_date":"2025-06-01","model_type":"other","page_url":"https://fal.run/fal-ai/chatterbox/speech-to-speech","tagline":"Whether you're working on memes, videos, games, or AI agents, Chatterbox brings your content to life.","last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/chatterbox/text-to-speech/multilingual","name":"Chatterbox","created_by":"fal","source":"official","description":"Whether you're working on memes, videos, games, or AI agents, Chatterbox brings your content to 
life.","status":"active","release_date":"2025-09-04","model_type":"tts","page_url":"https://fal.run/fal-ai/chatterbox/text-to-speech/multilingual","tagline":"Whether you're working on memes, videos, games, or AI agents, Chatterbox brings your content to life.","modalities":{"input":["text"],"output":["audio"]},"endpoints":["audio_speech"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/chatterbox/text-to-speech","name":"Chatterbox","created_by":"fal","source":"official","description":"Whether you're working on memes, videos, games, or AI agents, Chatterbox brings your content to life.","status":"active","release_date":"2025-06-01","model_type":"tts","page_url":"https://fal.run/fal-ai/chatterbox/text-to-speech","tagline":"Whether you're working on memes, videos, games, or AI agents, Chatterbox brings your content to life.","modalities":{"input":["text"],"output":["audio"]},"endpoints":["audio_speech"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/chrono-edit-lora-gallery/paintbrush","name":"Chrono Edit Lora Gallery","created_by":"fal","source":"official","description":"You can make edits simply by drawing a quick sketch on the input image.","status":"active","release_date":"2025-11-21","model_type":"image","page_url":"https://fal.run/fal-ai/chrono-edit-lora-gallery/paintbrush","tagline":"You can make edits simply by drawing a quick sketch on the input image.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/chrono-edit-lora-gallery/upscaler","name":"Chrono Edit Lora Gallery","created_by":"fal","source":"official","description":"Upscales and cleans up the image.","status":"active","release_date":"2025-11-21","model_type":"image","page_url":"https://fal.run/fal-ai/chrono-edit-lora-gallery/upscaler","tagline":"Upscales and cleans up the 
image.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/chrono-edit-lora","name":"Chrono Edit Lora","created_by":"fal","source":"official","description":"LoRA endpoint for the Chrono Edit model.","status":"active","release_date":"2025-11-21","model_type":"image","page_url":"https://fal.run/fal-ai/chrono-edit-lora","tagline":"LoRA endpoint for the Chrono Edit model.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/chrono-edit","name":"Chrono Edit","created_by":"fal","source":"official","description":"NVIDIA's Logically Consistent and Physics-Aware Image Editing Model","status":"active","release_date":"2025-10-30","model_type":"image","page_url":"https://fal.run/fal-ai/chrono-edit","tagline":"NVIDIA's Logically Consistent and Physics-Aware Image Editing Model","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/clarity-upscaler","name":"Clarity Upscaler","created_by":"fal","source":"official","description":"Clarity upscaler for upscaling images with high very fidelity.","status":"active","release_date":"2024-02-04","model_type":"image","page_url":"https://fal.run/fal-ai/clarity-upscaler","tagline":"Clarity upscaler for upscaling images with high very fidelity.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-05-06","last_updated":"2026-05-11"},{"id":"fal-ai/codeformer","name":"CodeFormer","created_by":"fal","source":"official","description":"Fix distorted or blurred photos of people with 
CodeFormer.","status":"active","release_date":"2025-01-31","model_type":"image","page_url":"https://fal.run/fal-ai/codeformer","tagline":"Fix distorted or blurred photos of people with CodeFormer.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/cogvideox-5b/image-to-video","name":"CogVideoX-5B","created_by":"fal","source":"official","description":"Generate videos from images and prompts using CogVideoX-5B","status":"active","release_date":"2024-10-17","model_type":"video","page_url":"https://fal.run/fal-ai/cogvideox-5b/image-to-video","tagline":"Generate videos from images and prompts using CogVideoX-5B","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/cogvideox-5b/video-to-video","name":"CogVideoX-5B","created_by":"fal","source":"official","description":"Generate videos from videos and prompts using CogVideoX-5B","status":"active","release_date":"2024-10-17","model_type":"other","page_url":"https://fal.run/fal-ai/cogvideox-5b/video-to-video","tagline":"Generate videos from videos and prompts using CogVideoX-5B","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/cogvideox-5b","name":"CogVideoX-5B","created_by":"fal","source":"official","description":"Generate videos from prompts using CogVideoX-5B","status":"active","release_date":"2025-01-14","model_type":"video","parameters":5,"page_url":"https://fal.run/fal-ai/cogvideox-5b","tagline":"Generate videos from prompts using CogVideoX-5B","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/cogview4","name":"CogView","created_by":"fal","source":"official","description":"Generate high quality images from text prompts using 
CogView4.","status":"active","release_date":"2025-03-04","model_type":"image","page_url":"https://fal.run/fal-ai/cogview4","tagline":"Generate high quality images from text prompts using CogView4.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/cohere-transcribe","name":"Cohere Transcribe","created_by":"fal","source":"official","description":"Cohere Transcribe turns your business audio into accurate text, ready for search, analytics, and automation","status":"active","release_date":"2026-04-22","model_type":"transcription","page_url":"https://fal.run/fal-ai/cohere-transcribe","tagline":"Cohere Transcribe turns your business audio into accurate text, ready for search, analytics, and automation","modalities":{"input":["audio"],"output":["text"]},"endpoints":["audio_transcriptions"],"last_seen_at":"2026-05-12","last_updated":"2026-06-03"},{"id":"fal-ai/control-light","name":"ControlLight","created_by":"fal","source":"official","description":"ControlLight is a LoRA fine-tune of FLUX.2 [klein] 9B that enhances low-light images while preserving scene structure and fine details, with a single alpha parameter that gives continuous control over","status":"active","release_date":"2026-05-27","model_type":"image","page_url":"https://fal.run/fal-ai/control-light","tagline":"ControlLight is a LoRA fine-tune of FLUX.2 [klein] 9B that enhances low-light images while preserving scene structure and fine details, with a single alpha parameter that gives continuous control over","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-05-29","last_updated":"2026-06-03"},{"id":"fal-ai/controlfoley","name":"Controlfoley","created_by":"fal","source":"official","description":"Foley Control is a video-to-audio model that automatically generates synchronized sound effects for videos, 
using text prompts to shape the type of sound while matching the timing and action on screen","status":"active","release_date":"2026-05-05","model_type":"other","page_url":"https://fal.run/fal-ai/controlfoley","tagline":"Foley Control is a video-to-audio model that automatically generates synchronized sound effects for videos, using text prompts to shape the type of sound while matching the timing and action on screen","last_seen_at":"2026-05-22","last_updated":"2026-06-03"},{"id":"fal-ai/controlnext","name":"ControlNeXt SVD","created_by":"fal","source":"official","description":"Animate a reference image with a driving video using ControlNeXt.","status":"active","release_date":"2024-09-05","model_type":"other","page_url":"https://fal.run/fal-ai/controlnext","tagline":"Animate a reference image with a driving video using ControlNeXt.","capabilities":{"vision":true},"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/cosmos-predict-2.5/distilled/text-to-video","name":"Cosmos Predict 2.5 2B Distilled","created_by":"fal","source":"official","description":"Generate video from text and videos using NVIDIA's 2B Cosmos Distilled Model","status":"active","release_date":"2026-02-24","model_type":"video","page_url":"https://fal.run/fal-ai/cosmos-predict-2.5/distilled/text-to-video","tagline":"Generate video from text and videos using NVIDIA's 2B Cosmos Distilled Model","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-28","last_updated":"2026-05-11"},{"id":"fal-ai/cosmos-predict-2.5/image-to-video","name":"Cosmos Predict 2.5 2B","created_by":"fal","source":"official","description":"Generate video from text and images using NVIDIA's 2B Cosmos Post-Trained Model","status":"active","release_date":"2026-02-24","model_type":"video","page_url":"https://fal.run/fal-ai/cosmos-predict-2.5/image-to-video","tagline":"Generate video from text and images using NVIDIA's 2B Cosmos Post-Trained 
Model","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-28","last_updated":"2026-05-11"},{"id":"fal-ai/cosmos-predict-2.5/text-to-video","name":"Cosmos Predict 2.5 2B","created_by":"fal","source":"official","description":"Generate video from text using NVIDIA's 2B Cosmos Post-Trained Model","status":"active","release_date":"2026-02-24","model_type":"video","page_url":"https://fal.run/fal-ai/cosmos-predict-2.5/text-to-video","tagline":"Generate video from text using NVIDIA's 2B Cosmos Post-Trained Model","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-28","last_updated":"2026-05-11"},{"id":"fal-ai/cosmos-predict-2.5/video-to-video","name":"Cosmos Predict 2.5 2B","created_by":"fal","source":"official","description":"Generate video from text and videos using NVIDIA's 2B Cosmos Post-Trained Model","status":"active","release_date":"2026-02-24","model_type":"other","page_url":"https://fal.run/fal-ai/cosmos-predict-2.5/video-to-video","tagline":"Generate video from text and videos using NVIDIA's 2B Cosmos Post-Trained Model","last_seen_at":"2026-02-24","last_updated":"2026-05-11"},{"id":"fal-ai/creatify/aurora","name":"Creatify Aurora","created_by":"fal","source":"official","description":"Generate high fidelity, studio quality videos of your avatar speaking or singing using the Aurora from Creatify team!","status":"active","release_date":"2025-12-11","model_type":"video","page_url":"https://fal.run/fal-ai/creatify/aurora","tagline":"Generate high fidelity, studio quality videos of your avatar speaking or singing using the Aurora from Creatify team!","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/creative-upscaler","name":"Creative Upscaler","created_by":"fal","source":"official","description":"Create 
creative upscaled images.","status":"active","release_date":"2024-02-27","model_type":"image","page_url":"https://fal.run/fal-ai/creative-upscaler","tagline":"Create creative upscaled images.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/csm-1b","name":"CSM-1B","created_by":"fal","source":"official","description":"CSM (Conversational Speech Model) is a speech generation model from Sesame that generates RVQ audio codes from text and audio inputs.","status":"active","release_date":"2025-03-13","model_type":"other","parameters":1,"page_url":"https://fal.run/fal-ai/csm-1b","tagline":"CSM (Conversational Speech Model) is a speech generation model from Sesame that generates RVQ audio codes from text and audio inputs.","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/davinci-magihuman","name":"Davinci Magihuman","created_by":"fal","source":"official","description":"Expressive facial performance, natural speech-expression coordination, realistic body motion, and accurate audio-video synchronization with DaVinci-MagiHuman model","status":"active","release_date":"2026-03-25","model_type":"video","page_url":"https://fal.run/fal-ai/davinci-magihuman","tagline":"Expressive facial performance, natural speech-expression coordination, realistic body motion, and accurate audio-video synchronization with DaVinci-MagiHuman model","capabilities":{"vision":true},"modalities":{"input":["text","image","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-28","last_updated":"2026-05-11"},{"id":"fal-ai/ddcolor","name":"DDColor","created_by":"fal","source":"official","description":"Bring colors into old or new black and white photos with DDColor.","status":"active","release_date":"2025-02-26","model_type":"image","page_url":"https://fal.run/fal-ai/ddcolor","tagline":"Bring colors into old or new black and white 
photos with DDColor.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/decart/lucy-5b/image-to-video","name":"Decart","created_by":"fal","source":"official","description":"Lucy-5B is a model that can create 5-second I2V videos in under 5 seconds, achieving >1x RTF end-to-end","status":"active","release_date":"2025-08-28","model_type":"video","page_url":"https://fal.run/fal-ai/decart/lucy-5b/image-to-video","tagline":"Lucy-5B is a model that can create 5-second I2V videos in under 5 seconds, achieving >1x RTF end-to-end","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/deepfilternet3","name":"DeepFilterNet 3","created_by":"fal","source":"official","description":"Enhance speech audio by removing background noise and upsampling to 48KHz","status":"active","release_date":"2026-01-07","model_type":"other","page_url":"https://fal.run/fal-ai/deepfilternet3","tagline":"Enhance speech audio by removing background noise and upsampling to 48KHz","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/demucs","name":"Demucs","created_by":"fal","source":"official","description":"SOTA stemming model for voice, drums, bass, guitar and more.","status":"active","release_date":"2025-10-27","model_type":"other","page_url":"https://fal.run/fal-ai/demucs","tagline":"SOTA stemming model for voice, drums, bass, guitar and more.","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/depth-anything-video","name":"Depth Anything Video","created_by":"fal","source":"official","description":"Generates depth maps from video using Video Depth Anything (CVPR 
2025).","status":"active","release_date":"2026-03-02","model_type":"other","page_url":"https://fal.run/fal-ai/depth-anything-video","tagline":"Generates depth maps from video using Video Depth Anything (CVPR 2025).","last_seen_at":"2026-03-02","last_updated":"2026-05-11"},{"id":"fal-ai/dia-tts/voice-clone","name":"Dia Tts","created_by":"fal","source":"official","description":"Clone dialog voices from a sample audio and generate dialogs from text prompts using the Dia TTS which leverages advanced AI techniques to create high-quality text-to-speech.","status":"active","release_date":"2025-04-22","model_type":"other","page_url":"https://fal.run/fal-ai/dia-tts/voice-clone","tagline":"Clone dialog voices from a sample audio and generate dialogs from text prompts using the Dia TTS which leverages advanced AI techniques to create high-quality text-to-speech.","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/dia-tts","name":"Dia","created_by":"fal","source":"official","description":"Dia directly generates realistic dialogue from transcripts.","status":"active","release_date":"2025-04-22","model_type":"tts","page_url":"https://fal.run/fal-ai/dia-tts","tagline":"Dia directly generates realistic dialogue from transcripts.","modalities":{"input":["text"],"output":["audio"]},"endpoints":["audio_speech"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/diffrhythm","name":"DiffRhythm: Lyrics to Song","created_by":"fal","source":"official","description":"DiffRhythm is a blazing fast model for transforming lyrics into full songs.","status":"active","release_date":"2025-03-04","model_type":"other","page_url":"https://fal.run/fal-ai/diffrhythm","tagline":"DiffRhythm is a blazing fast model for transforming lyrics into full songs.","last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/diffusion-edge","name":"DiffusionEdge","created_by":"fal","source":"official","description":"Diffusion based high quality edge 
detection","status":"active","release_date":"2024-01-08","model_type":"image","page_url":"https://fal.run/fal-ai/diffusion-edge","tagline":"Diffusion based high quality edge detection","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/docres/dewarp","name":"DocRes-dewarp","created_by":"fal","source":"official","description":"Enhance wraped, folded documents with the superior quality of docres for sharper, clearer results.","status":"active","release_date":"2025-03-03","model_type":"image","page_url":"https://fal.run/fal-ai/docres/dewarp","tagline":"Enhance wraped, folded documents with the superior quality of docres for sharper, clearer results.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/docres","name":"DocRes","created_by":"fal","source":"official","description":"Enhance low-resolution, blur, shadowed documents with the superior quality of docres for sharper, clearer results.","status":"active","release_date":"2025-03-03","model_type":"image","page_url":"https://fal.run/fal-ai/docres","tagline":"Enhance low-resolution, blur, shadowed documents with the superior quality of docres for sharper, clearer results.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/drct-super-resolution","name":"DRCT-Super-Resolution","created_by":"fal","source":"official","description":"Upscale your images with DRCT-Super-Resolution.","status":"active","release_date":"2025-02-24","model_type":"image","page_url":"https://fal.run/fal-ai/drct-super-resolution","tagline":"Upscale your images with 
DRCT-Super-Resolution.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/dreamo","name":"DreamO","created_by":"fal","source":"official","description":"DreamO is an image customization framework designed to support a wide range of tasks while facilitating seamless integration of multiple conditions.","status":"active","release_date":"2025-05-19","model_type":"image","page_url":"https://fal.run/fal-ai/dreamo","tagline":"DreamO is an image customization framework designed to support a wide range of tasks while facilitating seamless integration of multiple conditions.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/dreamomni2/edit","name":"DreamOmni2","created_by":"fal","source":"official","description":"DreamOmni2 is a unified multimodal model for text and image guided image editing.","status":"active","release_date":"2025-10-10","model_type":"image","page_url":"https://fal.run/fal-ai/dreamomni2/edit","tagline":"DreamOmni2 is a unified multimodal model for text and image guided image editing.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/dreamshaper","name":"Dreamshaper","created_by":"fal","source":"official","description":"Dreamshaper model.","status":"active","release_date":"2024-04-25","model_type":"image","page_url":"https://fal.run/fal-ai/dreamshaper","tagline":"Dreamshaper model.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/dubbing","name":"Dubbing","created_by":"fal","source":"official","description":"This endpoint delivers seamlessly 
localized videos by generating lip-synced dubs in multiple languages, ensuring natural and immersive multilingual experiences","status":"active","release_date":"2024-12-20","model_type":"other","page_url":"https://fal.run/fal-ai/dubbing","tagline":"This endpoint delivers seamlessly localized videos by generating lip-synced dubs in multiple languages, ensuring natural and immersive multilingual experiences","last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/dwpose/video","name":"DWPose Pose Prediction","created_by":"fal","source":"official","description":"Predict poses from videos.","status":"active","release_date":"2025-06-15","model_type":"other","page_url":"https://fal.run/fal-ai/dwpose/video","tagline":"Predict poses from videos.","last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/dwpose","name":"DWPose Pose Prediction","created_by":"fal","source":"official","description":"Predict poses from images.","status":"active","release_date":"2024-06-01","model_type":"image","page_url":"https://fal.run/fal-ai/dwpose","tagline":"Predict poses from images.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/echomimic-v3","name":"EchoMimic V3","created_by":"fal","source":"official","description":"EchoMimic V3 generates a talking avatar model from a picture, audio and text prompt.","status":"active","release_date":"2025-08-13","model_type":"other","page_url":"https://fal.run/fal-ai/echomimic-v3","tagline":"EchoMimic V3 generates a talking avatar model from a picture, audio and text prompt.","last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/editto","name":"Editto","created_by":"fal","source":"official","description":"Edit videos using instruction-based prompting using Editto 
model!","status":"active","release_date":"2025-11-12","model_type":"other","page_url":"https://fal.run/fal-ai/editto","tagline":"Edit videos using instruction-based prompting using Editto model!","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/elevenlabs/audio-isolation","name":"ElevenLabs Audio Isolation","created_by":"fal","source":"official","description":"Isolate audio tracks using ElevenLabs advanced audio isolation technology.","status":"active","release_date":"2025-02-27","model_type":"other","page_url":"https://fal.run/fal-ai/elevenlabs/audio-isolation","tagline":"Isolate audio tracks using ElevenLabs advanced audio isolation technology.","capabilities":{"streaming":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/elevenlabs/dubbing","name":"ElevenLabs Dubbing","created_by":"fal","source":"official","description":"Generate dubbed videos or audios using ElevenLabs Dubbing feature!","status":"active","release_date":"2026-01-14","model_type":"other","page_url":"https://fal.run/fal-ai/elevenlabs/dubbing","tagline":"Generate dubbed videos or audios using ElevenLabs Dubbing feature!","last_seen_at":"2026-05-27","last_updated":"2026-06-03"},{"id":"fal-ai/elevenlabs/music","name":"Elevenlabs Music","created_by":"fal","source":"official","description":"Generate high quality, realistic music with fine controls using Elevenlabs Music!","status":"active","release_date":"2025-12-22","model_type":"other","page_url":"https://fal.run/fal-ai/elevenlabs/music","tagline":"Generate high quality, realistic music with fine controls using Elevenlabs Music!","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/elevenlabs/sound-effects/v2","name":"Elevenlabs Sound Effects V2","created_by":"fal","source":"official","description":"Generate sound effects using ElevenLabs advanced sound effects 
model.","status":"active","release_date":"2025-09-02","model_type":"other","page_url":"https://fal.run/fal-ai/elevenlabs/sound-effects/v2","tagline":"Generate sound effects using ElevenLabs advanced sound effects model.","capabilities":{"streaming":true},"last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/elevenlabs/speech-to-text/scribe-v2","name":"ElevenLabs Speech to Text - Scribe V2","created_by":"fal","source":"official","description":"Use Scribe-V2 from ElevenLabs to do blazingly fast speech to text inferences!","status":"active","release_date":"2026-01-14","model_type":"transcription","page_url":"https://fal.run/fal-ai/elevenlabs/speech-to-text/scribe-v2","tagline":"Use Scribe-V2 from ElevenLabs to do blazingly fast speech to text inferences!","modalities":{"input":["audio"],"output":["text"]},"endpoints":["audio_transcriptions"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/elevenlabs/speech-to-text","name":"ElevenLabs Speech to Text","created_by":"fal","source":"official","description":"Generate text from speech using ElevenLabs advanced speech-to-text model.","status":"active","release_date":"2025-02-27","model_type":"transcription","page_url":"https://fal.run/fal-ai/elevenlabs/speech-to-text","tagline":"Generate text from speech using ElevenLabs advanced speech-to-text model.","modalities":{"input":["audio"],"output":["text"]},"endpoints":["audio_transcriptions"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/elevenlabs/text-to-dialogue/eleven-v3","name":"Elevenlabs","created_by":"fal","source":"official","description":"Generate realistic audio dialogues using Eleven-v3 from ElevenLabs.","status":"active","release_date":"2025-09-09","model_type":"other","page_url":"https://fal.run/fal-ai/elevenlabs/text-to-dialogue/eleven-v3","tagline":"Generate realistic audio dialogues using Eleven-v3 from 
ElevenLabs.","capabilities":{"streaming":true},"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/elevenlabs/tts/eleven-v3","name":"Elevenlabs Tts Eleven V3","created_by":"fal","source":"official","description":"Generate text-to-speech audio using Eleven-v3 from ElevenLabs.","status":"active","release_date":"2025-08-20","model_type":"other","page_url":"https://fal.run/fal-ai/elevenlabs/tts/eleven-v3","tagline":"Generate text-to-speech audio using Eleven-v3 from ElevenLabs.","capabilities":{"streaming":true},"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/elevenlabs/tts/multilingual-v2","name":"ElevenLabs TTS Multilingual v2","created_by":"fal","source":"official","description":"Generate multilingual text-to-speech audio using ElevenLabs TTS Multilingual v2.","status":"active","release_date":"2025-02-27","model_type":"other","page_url":"https://fal.run/fal-ai/elevenlabs/tts/multilingual-v2","tagline":"Generate multilingual text-to-speech audio using ElevenLabs TTS Multilingual v2.","capabilities":{"streaming":true},"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/elevenlabs/tts/turbo-v2.5","name":"ElevenLabs TTS Turbo v2.5","created_by":"fal","source":"official","description":"Generate high-speed text-to-speech audio using ElevenLabs TTS Turbo v2.5.","status":"active","release_date":"2025-02-27","model_type":"tts","page_url":"https://fal.run/fal-ai/elevenlabs/tts/turbo-v2.5","tagline":"Generate high-speed text-to-speech audio using ElevenLabs TTS Turbo v2.5.","capabilities":{"streaming":true},"modalities":{"input":["text"],"output":["audio"]},"endpoints":["audio_speech"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/elevenlabs/voice-changer","name":"ElevenLabs Voice Changer","created_by":"fal","source":"official","description":"Change the voices in your audios with voices in 
ElevenLabs!","status":"active","release_date":"2026-01-14","model_type":"other","page_url":"https://fal.run/fal-ai/elevenlabs/voice-changer","tagline":"Change the voices in your audios with voices in ElevenLabs!","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/emu-3.5-image/edit-image","name":"Emu 3.5 Image","created_by":"fal","source":"official","description":"Edit images with a text prompt using Emu 3.5 Image","status":"active","release_date":"2025-11-01","model_type":"image","page_url":"https://fal.run/fal-ai/emu-3.5-image/edit-image","tagline":"Edit images with a text prompt using Emu 3.5 Image","capabilities":{"streaming":true,"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/emu-3.5-image/text-to-image","name":"Emu 3.5 Image","created_by":"fal","source":"official","description":"Generate images from text using Emu 3.5 Image","status":"active","release_date":"2025-11-01","model_type":"image","page_url":"https://fal.run/fal-ai/emu-3.5-image/text-to-image","tagline":"Generate images from text using Emu 3.5 Image","capabilities":{"streaming":true,"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/era-3d","name":"Era 3D","created_by":"fal","source":"official","description":"A powerful image to novel multiview model with normals.","status":"active","release_date":"2024-07-01","model_type":"image","page_url":"https://fal.run/fal-ai/era-3d","tagline":"A powerful image to novel multiview model with normals.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/ernie-image/lora/turbo","name":"Ernie Image Lora Turbo","created_by":"fal","source":"official","description":"High-quality text-to-image 
model by Baidu.","status":"active","release_date":"2026-04-16","model_type":"image","page_url":"https://fal.run/fal-ai/ernie-image/lora/turbo","tagline":"High-quality text-to-image model by Baidu.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/ernie-image/lora","name":"Ernie Image Lora","created_by":"fal","source":"official","description":"High-quality text-to-image model by Baidu.","status":"active","release_date":"2026-04-16","model_type":"image","page_url":"https://fal.run/fal-ai/ernie-image/lora","tagline":"High-quality text-to-image model by Baidu.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/ernie-image-trainer","name":"ERNIE-Image Trainer","created_by":"fal","source":"official","description":"LoRA trainer for ERNIE-Image, Baidu's powerful 8B-parameter text-to-image model.","status":"active","release_date":"2026-04-15","model_type":"other","page_url":"https://fal.run/fal-ai/ernie-image-trainer","tagline":"LoRA trainer for ERNIE-Image, Baidu's powerful 8B-parameter text-to-image model.","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/ernie-image/turbo","name":"Ernie Image Turbo","created_by":"fal","source":"official","description":"High-quality text-to-image model by Baidu.","status":"active","release_date":"2026-04-13","model_type":"image","page_url":"https://fal.run/fal-ai/ernie-image/turbo","tagline":"High-quality text-to-image model by Baidu.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/ernie-image","name":"Ernie Image","created_by":"fal","source":"official","description":"High-quality text-to-image model by 
Baidu.","status":"active","release_date":"2026-04-10","model_type":"image","page_url":"https://fal.run/fal-ai/ernie-image","tagline":"High-quality text-to-image model by Baidu.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-05-16","last_updated":"2026-06-03"},{"id":"fal-ai/esrgan","name":"Upscale Images","created_by":"fal","source":"official","description":"Upscale images by a given factor.","status":"active","release_date":"2023-10-30","model_type":"image","page_url":"https://fal.run/fal-ai/esrgan","tagline":"Upscale images by a given factor.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/evf-sam","name":"EVF-SAM2 Segmentation","created_by":"fal","source":"official","description":"EVF-SAM2 combines natural language understanding with advanced segmentation capabilities, allowing you to precisely mask image regions using intuitive positive and negative text prompts.","status":"active","release_date":"2025-02-26","model_type":"image","page_url":"https://fal.run/fal-ai/evf-sam","tagline":"EVF-SAM2 combines natural language understanding with advanced segmentation capabilities, allowing you to precisely mask image regions using intuitive positive and negative text prompts.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/f-lite/standard","name":"F Lite","created_by":"fal","source":"official","description":"F Lite is a 10B parameter diffusion model created by Fal and Freepik, trained exclusively on copyright-safe and SFW content.","status":"active","release_date":"2025-04-28","model_type":"image","page_url":"https://fal.run/fal-ai/f-lite/standard","tagline":"F Lite is a 10B parameter diffusion model created by Fal and 
Freepik, trained exclusively on copyright-safe and SFW content.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/f-lite/texture","name":"F Lite (texture mode)","created_by":"fal","source":"official","description":"F Lite is a 10B parameter diffusion model created by Fal and Freepik, trained exclusively on copyright-safe and SFW content.","status":"active","release_date":"2025-04-28","model_type":"image","page_url":"https://fal.run/fal-ai/f-lite/texture","tagline":"F Lite is a 10B parameter diffusion model created by Fal and Freepik, trained exclusively on copyright-safe and SFW content.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/f5-tts","name":"F5 TTS","created_by":"fal","source":"official","description":"F5 TTS","status":"active","release_date":"2024-10-17","model_type":"other","page_url":"https://fal.run/fal-ai/f5-tts","tagline":"F5 TTS","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/face-to-sticker","name":"Face to Sticker","created_by":"fal","source":"official","description":"Create stickers from faces.","status":"active","release_date":"2024-03-11","model_type":"image","page_url":"https://fal.run/fal-ai/face-to-sticker","tagline":"Create stickers from faces.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/fashn/tryon/v1.5","name":"FASHN Virtual Try-On V1.5","created_by":"fal","source":"official","description":"FASHN v1.5 delivers precise virtual try-on capabilities, accurately rendering garment details like text and patterns at 576x864 resolution from both on-model and flat-lay photo 
references.","status":"active","release_date":"2025-04-21","model_type":"image","page_url":"https://fal.run/fal-ai/fashn/tryon/v1.5","tagline":"FASHN v1.5 delivers precise virtual try-on capabilities, accurately rendering garment details like text and patterns at 576x864 resolution from both on-model and flat-lay photo references.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/fashn/tryon/v1.6","name":"FASHN Virtual Try-On V1.6","created_by":"fal","source":"official","description":"FASHN v1.6 delivers precise virtual try-on capabilities, accurately rendering garment details like text and patterns at 864x1296 resolution from both on-model and flat-lay photo references.","status":"active","release_date":"2025-06-24","model_type":"image","page_url":"https://fal.run/fal-ai/fashn/tryon/v1.6","tagline":"FASHN v1.6 delivers precise virtual try-on capabilities, accurately rendering garment details like text and patterns at 864x1296 resolution from both on-model and flat-lay photo references.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/fast-animatediff/text-to-video","name":"AnimateDiff","created_by":"fal","source":"official","description":"Animate your ideas!","status":"active","release_date":"2024-02-21","model_type":"video","page_url":"https://fal.run/fal-ai/fast-animatediff/text-to-video","tagline":"Animate your ideas!","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/fast-animatediff/turbo/text-to-video","name":"AnimateDiff Turbo","created_by":"fal","source":"official","description":"Animate your ideas in lightning 
speed!","status":"active","release_date":"2024-02-13","model_type":"video","page_url":"https://fal.run/fal-ai/fast-animatediff/turbo/text-to-video","tagline":"Animate your ideas in lightning speed!","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/fast-animatediff/turbo/video-to-video","name":"AnimateDiff Turbo","created_by":"fal","source":"official","description":"Re-animate your videos in lightning speed!","status":"active","release_date":"2024-02-13","model_type":"other","page_url":"https://fal.run/fal-ai/fast-animatediff/turbo/video-to-video","tagline":"Re-animate your videos in lightning speed!","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/fast-animatediff/video-to-video","name":"AnimateDiff","created_by":"fal","source":"official","description":"Re-animate your videos!","status":"active","release_date":"2024-02-13","model_type":"other","page_url":"https://fal.run/fal-ai/fast-animatediff/video-to-video","tagline":"Re-animate your videos!","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/fast-fooocus-sdxl/image-to-image","name":"Fooocus","created_by":"fal","source":"official","description":"Fooocus extreme speed mode as a standalone app.","status":"active","release_date":"2024-03-13","model_type":"image","page_url":"https://fal.run/fal-ai/fast-fooocus-sdxl/image-to-image","tagline":"Fooocus extreme speed mode as a standalone app.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/fast-fooocus-sdxl","name":"Fooocus","created_by":"fal","source":"official","description":"Fooocus extreme speed mode as a standalone app.","status":"active","release_date":"2024-02-16","model_type":"image","page_url":"https://fal.run/fal-ai/fast-fooocus-sdxl","tagline":"Fooocus extreme speed mode as a standalone 
app.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/fast-lcm-diffusion/image-to-image","name":"Latent Consistency Models (v1.5/XL)","created_by":"fal","source":"official","description":"Run SDXL at the speed of light","status":"active","release_date":"2024-02-19","model_type":"image","page_url":"https://fal.run/fal-ai/fast-lcm-diffusion/image-to-image","tagline":"Run SDXL at the speed of light","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/fast-lcm-diffusion/inpainting","name":"Latent Consistency Models (v1.5/XL)","created_by":"fal","source":"official","description":"Run SDXL at the speed of light","status":"active","release_date":"2024-02-19","model_type":"image","page_url":"https://fal.run/fal-ai/fast-lcm-diffusion/inpainting","tagline":"Run SDXL at the speed of light","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/fast-lcm-diffusion","name":"Latent Consistency Models (v1.5/XL)","created_by":"fal","source":"official","description":"Run SDXL at the speed of light","status":"active","release_date":"2024-02-19","model_type":"image","page_url":"https://fal.run/fal-ai/fast-lcm-diffusion","tagline":"Run SDXL at the speed of light","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/fast-lightning-sdxl/image-to-image","name":"Stable Diffusion XL Lightning","created_by":"fal","source":"official","description":"Run SDXL at the speed of 
light","status":"active","release_date":"2024-02-21","model_type":"image","page_url":"https://fal.run/fal-ai/fast-lightning-sdxl/image-to-image","tagline":"Run SDXL at the speed of light","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/fast-lightning-sdxl/inpainting","name":"Stable Diffusion XL Lightning","created_by":"fal","source":"official","description":"Run SDXL at the speed of light","status":"active","release_date":"2024-02-21","model_type":"image","page_url":"https://fal.run/fal-ai/fast-lightning-sdxl/inpainting","tagline":"Run SDXL at the speed of light","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/fast-lightning-sdxl","name":"Stable Diffusion XL Lightning","created_by":"fal","source":"official","description":"Run SDXL at the speed of light","status":"active","release_date":"2024-04-11","model_type":"image","page_url":"https://fal.run/fal-ai/fast-lightning-sdxl","tagline":"Run SDXL at the speed of light","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/fast-sdxl-controlnet-canny/image-to-image","name":"ControlNet SDXL","created_by":"fal","source":"official","description":"Generate Images with ControlNet.","status":"active","release_date":"2023-12-01","model_type":"image","page_url":"https://fal.run/fal-ai/fast-sdxl-controlnet-canny/image-to-image","tagline":"Generate Images with ControlNet.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/fast-sdxl-controlnet-canny/inpainting","name":"ControlNet 
SDXL","created_by":"fal","source":"official","description":"Generate Images with ControlNet.","status":"active","release_date":"2023-12-01","model_type":"image","page_url":"https://fal.run/fal-ai/fast-sdxl-controlnet-canny/inpainting","tagline":"Generate Images with ControlNet.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/fast-sdxl-controlnet-canny","name":"ControlNet SDXL","created_by":"fal","source":"official","description":"Generate Images with ControlNet.","status":"active","release_date":"2024-02-28","model_type":"image","page_url":"https://fal.run/fal-ai/fast-sdxl-controlnet-canny","tagline":"Generate Images with ControlNet.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/fast-sdxl/image-to-image","name":"Stable Diffusion XL","created_by":"fal","source":"official","description":"Run SDXL at the speed of light","status":"active","release_date":"2024-04-16","model_type":"image","page_url":"https://fal.run/fal-ai/fast-sdxl/image-to-image","tagline":"Run SDXL at the speed of light","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/fast-sdxl/inpainting","name":"Stable Diffusion XL","created_by":"fal","source":"official","description":"Run SDXL at the speed of light","status":"active","release_date":"2024-04-16","model_type":"image","page_url":"https://fal.run/fal-ai/fast-sdxl/inpainting","tagline":"Run SDXL at the speed of light","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/fast-sdxl","name":"Stable Diffusion 
XL","created_by":"fal","source":"official","description":"Run SDXL at the speed of light","status":"active","release_date":"2024-06-12","model_type":"image","page_url":"https://fal.run/fal-ai/fast-sdxl","tagline":"Run SDXL at the speed of light","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/fast-svd-lcm/text-to-video","name":"Stable Video Diffusion Turbo","created_by":"fal","source":"official","description":"Generate short video clips from your images using SVD v1.1 at Lightning Speed","status":"active","release_date":"2024-06-03","model_type":"video","page_url":"https://fal.run/fal-ai/fast-svd-lcm/text-to-video","tagline":"Generate short video clips from your images using SVD v1.1 at Lightning Speed","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/fast-svd-lcm","name":"Stable Video Diffusion Turbo","created_by":"fal","source":"official","description":"Generate short video clips from your images using SVD v1.1 at Lightning Speed","status":"active","release_date":"2024-02-13","model_type":"video","page_url":"https://fal.run/fal-ai/fast-svd-lcm","tagline":"Generate short video clips from your images using SVD v1.1 at Lightning Speed","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/fast-svd/text-to-video","name":"Stable Video Diffusion","created_by":"fal","source":"official","description":"Generate short video clips from your prompts using SVD v1.1","status":"active","release_date":"2024-09-16","model_type":"video","page_url":"https://fal.run/fal-ai/fast-svd/text-to-video","tagline":"Generate short video clips from your prompts using SVD 
v1.1","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/ffmpeg-api/compose","name":"FFmpeg API Compose","created_by":"fal","source":"official","description":"Compose videos from multiple media sources using FFmpeg API.","status":"active","release_date":"2025-01-22","model_type":"other","page_url":"https://fal.run/fal-ai/ffmpeg-api/compose","tagline":"Compose videos from multiple media sources using FFmpeg API.","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/ffmpeg-api/extract-frame","name":"Ffmpeg Api","created_by":"fal","source":"official","description":"ffmpeg endpoint for first, middle and last frame extraction from videos","status":"active","release_date":"2025-06-09","model_type":"image","page_url":"https://fal.run/fal-ai/ffmpeg-api/extract-frame","tagline":"ffmpeg endpoint for first, middle and last frame extraction from videos","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/ffmpeg-api/images-to-video","name":"Ffmpeg Api Images to Video","created_by":"fal","source":"official","description":"A fal.ai endpoint that stitches an ordered list of images into an MP4 video by holding each image for a specified number of frames at a configurable frame rate","status":"active","release_date":"2026-05-05","model_type":"video","page_url":"https://fal.run/fal-ai/ffmpeg-api/images-to-video","tagline":"A fal.ai endpoint that stitches an ordered list of images into an MP4 video by holding each image for a specified number of frames at a configurable frame rate","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-05-05","last_updated":"2026-05-11"},{"id":"fal-ai/ffmpeg-api/loudnorm","name":"Ffmpeg 
Api","created_by":"fal","source":"official","description":"Get EBU R128 loudness normalization from audio files using FFmpeg API.","status":"active","release_date":"2025-07-08","model_type":"other","page_url":"https://fal.run/fal-ai/ffmpeg-api/loudnorm","tagline":"Get EBU R128 loudness normalization from audio files using FFmpeg API.","capabilities":{"structured_output":true,"json_mode":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/ffmpeg-api/merge-audio-video","name":"Ffmpeg Api Merge Audio-Video","created_by":"fal","source":"official","description":"Merge videos with standalone audio files or audio from video files.","status":"active","release_date":"2025-06-09","model_type":"other","page_url":"https://fal.run/fal-ai/ffmpeg-api/merge-audio-video","tagline":"Merge videos with standalone audio files or audio from video files.","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/ffmpeg-api/merge-audios","name":"FFmpeg API [Merge Audios]","created_by":"fal","source":"official","description":"Merge audios into a single audio using FFmpeg API!","status":"active","release_date":"2025-12-23","model_type":"other","page_url":"https://fal.run/fal-ai/ffmpeg-api/merge-audios","tagline":"Merge audios into a single audio using FFmpeg API!","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/ffmpeg-api/merge-videos","name":"Ffmpeg Api","created_by":"fal","source":"official","description":"Use ffmpeg capabilities to merge 2 or more videos.","status":"active","release_date":"2025-08-12","model_type":"other","page_url":"https://fal.run/fal-ai/ffmpeg-api/merge-videos","tagline":"Use ffmpeg capabilities to merge 2 or more videos.","last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/ffmpeg-api/metadata","name":"FFmpeg API Metadata","created_by":"fal","source":"official","description":"Get encoding metadata from video and audio files using FFmpeg 
API.","status":"active","release_date":"2025-01-22","model_type":"other","page_url":"https://fal.run/fal-ai/ffmpeg-api/metadata","tagline":"Get encoding metadata from video and audio files using FFmpeg API.","capabilities":{"structured_output":true,"json_mode":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/ffmpeg-api/waveform","name":"FFmpeg API Waveform","created_by":"fal","source":"official","description":"Get waveform data from audio files using FFmpeg API.","status":"active","release_date":"2025-01-22","model_type":"other","page_url":"https://fal.run/fal-ai/ffmpeg-api/waveform","tagline":"Get waveform data from audio files using FFmpeg API.","capabilities":{"structured_output":true,"json_mode":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/film/video","name":"FILM","created_by":"fal","source":"official","description":"Interpolate videos with FILM - Frame Interpolation for Large Motion","status":"active","release_date":"2025-07-22","model_type":"other","page_url":"https://fal.run/fal-ai/film/video","tagline":"Interpolate videos with FILM - Frame Interpolation for Large Motion","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/film","name":"FILM","created_by":"fal","source":"official","description":"Interpolate images with FILM - Frame Interpolation for Large Motion","status":"active","release_date":"2025-07-22","model_type":"image","page_url":"https://fal.run/fal-ai/film","tagline":"Interpolate images with FILM - Frame Interpolation for Large Motion","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/finegrain-eraser/bbox","name":"Finegrain Eraser Bbox","created_by":"fal","source":"official","description":"Finegrain Eraser removes any object selected with a bounding box—along with its shadows, reflections, and lighting artifacts—seamlessly 
reconstructing the scene with contextually accurate content.","status":"active","release_date":"2025-04-09","model_type":"image","page_url":"https://fal.run/fal-ai/finegrain-eraser/bbox","tagline":"Finegrain Eraser removes any object selected with a bounding box—along with its shadows, reflections, and lighting artifacts—seamlessly reconstructing the scene with contextually accurate content.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/finegrain-eraser/mask","name":"Finegrain Eraser Mask","created_by":"fal","source":"official","description":"Finegrain Eraser removes any object selected with a mask—along with its shadows, reflections, and lighting artifacts—seamlessly reconstructing the scene with contextually accurate content.","status":"active","release_date":"2025-04-10","model_type":"image","page_url":"https://fal.run/fal-ai/finegrain-eraser/mask","tagline":"Finegrain Eraser removes any object selected with a mask—along with its shadows, reflections, and lighting artifacts—seamlessly reconstructing the scene with contextually accurate content.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/finegrain-eraser","name":"Finegrain Eraser","created_by":"fal","source":"official","description":"Finegrain Eraser removes objects—along with their shadows, reflections, and lighting artifacts—using only natural language, seamlessly filling the scene with contextually accurate content.","status":"active","release_date":"2025-04-09","model_type":"image","page_url":"https://fal.run/fal-ai/finegrain-eraser","tagline":"Finegrain Eraser removes objects—along with their shadows, reflections, and lighting artifacts—using only natural language, seamlessly filling the scene with contextually accurate 
content.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/firered-image-edit-v1.1","name":"Firered Image Edit V1.1","created_by":"fal","source":"official","description":"FireRed Image Edit v1.1 is an updated version of FireRed Image Edit, with improved image editing capabilities.","status":"active","release_date":"2026-03-05","model_type":"image","page_url":"https://fal.run/fal-ai/firered-image-edit-v1.1","tagline":"FireRed Image Edit v1.1 is an updated version of FireRed Image Edit, with improved image editing capabilities.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-03-05","last_updated":"2026-05-11"},{"id":"fal-ai/firered-image-edit","name":"Firered Image Edit","created_by":"fal","source":"official","description":"FireRed Image Edit is FireRed's state of the art open source editing model, re-trained from Qwen Image Edit 2509.","status":"active","release_date":"2026-02-19","model_type":"image","page_url":"https://fal.run/fal-ai/firered-image-edit","tagline":"FireRed Image Edit is FireRed's state of the art open source editing model, re-trained from Qwen Image Edit 2509.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-10","last_updated":"2026-06-18"},{"id":"fal-ai/flashhead","name":"Flashhead","created_by":"fal","source":"official","description":"SoulX-FlashHead is a unified 1.3B-parameter framework designed for high-fidelity, infinite-length, and real-time streaming portrait video generation.","status":"active","release_date":"2026-03-12","model_type":"video","page_url":"https://fal.run/fal-ai/flashhead","tagline":"SoulX-FlashHead is a unified 1.3B-parameter framework designed for high-fidelity, infinite-length, and real-time streaming portrait video 
generation.","capabilities":{"streaming":true,"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-05-07","last_updated":"2026-05-11"},{"id":"fal-ai/flashtalk","name":"Flashtalk","created_by":"fal","source":"official","description":"Audio-driven talking avatar generation powered by the SoulX-FlashTalk 14B model.","status":"active","release_date":"2026-03-12","model_type":"other","page_url":"https://fal.run/fal-ai/flashtalk","tagline":"Audio-driven talking avatar generation powered by the SoulX-FlashTalk 14B model.","last_seen_at":"2026-05-07","last_updated":"2026-05-11"},{"id":"fal-ai/flashvsr/upscale/video","name":"Flashvsr","created_by":"fal","source":"official","description":"Upscale your videos using FlashVSR with the fastest speeds!","status":"active","release_date":"2025-11-11","model_type":"other","page_url":"https://fal.run/fal-ai/flashvsr/upscale/video","tagline":"Upscale your videos using FlashVSR with the fastest speeds!","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/florence-2-large/caption-to-phrase-grounding","name":"Florence-2 Large","created_by":"fal","source":"official","description":"Florence-2 is an advanced vision foundation model that uses a prompt-based approach to handle a wide range of vision and vision-language tasks","status":"active","release_date":"2024-06-22","model_type":"image","page_url":"https://fal.run/fal-ai/florence-2-large/caption-to-phrase-grounding","tagline":"Florence-2 is an advanced vision foundation model that uses a prompt-based approach to handle a wide range of vision and vision-language tasks","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/florence-2-large/caption","name":"Florence 2 Large Caption","created_by":"fal","source":"official","description":"Florence-2 is an advanced vision foundation 
model that uses a prompt-based approach to handle a wide range of vision and vision-language tasks","status":"active","release_date":"2024-06-22","model_type":"other","page_url":"https://fal.run/fal-ai/florence-2-large/caption","tagline":"Florence-2 is an advanced vision foundation model that uses a prompt-based approach to handle a wide range of vision and vision-language tasks","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/florence-2-large/dense-region-caption","name":"Florence-2 Large","created_by":"fal","source":"official","description":"Florence-2 is an advanced vision foundation model that uses a prompt-based approach to handle a wide range of vision and vision-language tasks","status":"active","release_date":"2024-06-22","model_type":"image","page_url":"https://fal.run/fal-ai/florence-2-large/dense-region-caption","tagline":"Florence-2 is an advanced vision foundation model that uses a prompt-based approach to handle a wide range of vision and vision-language tasks","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/florence-2-large/detailed-caption","name":"Florence 2 Large Detailed Caption","created_by":"fal","source":"official","description":"Florence-2 is an advanced vision foundation model that uses a prompt-based approach to handle a wide range of vision and vision-language tasks","status":"active","release_date":"2024-06-22","model_type":"other","page_url":"https://fal.run/fal-ai/florence-2-large/detailed-caption","tagline":"Florence-2 is an advanced vision foundation model that uses a prompt-based approach to handle a wide range of vision and vision-language tasks","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/florence-2-large/more-detailed-caption","name":"Florence-2 
Large","created_by":"fal","source":"official","description":"Florence-2 is an advanced vision foundation model that uses a prompt-based approach to handle a wide range of vision and vision-language tasks","status":"active","release_date":"2024-06-22","model_type":"other","page_url":"https://fal.run/fal-ai/florence-2-large/more-detailed-caption","tagline":"Florence-2 is an advanced vision foundation model that uses a prompt-based approach to handle a wide range of vision and vision-language tasks","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/florence-2-large/object-detection","name":"Florence-2 Large","created_by":"fal","source":"official","description":"Florence-2 is an advanced vision foundation model that uses a prompt-based approach to handle a wide range of vision and vision-language tasks","status":"active","release_date":"2024-06-22","model_type":"image","page_url":"https://fal.run/fal-ai/florence-2-large/object-detection","tagline":"Florence-2 is an advanced vision foundation model that uses a prompt-based approach to handle a wide range of vision and vision-language tasks","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/florence-2-large/ocr-with-region","name":"Florence-2 Large","created_by":"fal","source":"official","description":"Florence-2 is an advanced vision foundation model that uses a prompt-based approach to handle a wide range of vision and vision-language tasks","status":"active","release_date":"2024-06-22","model_type":"image","page_url":"https://fal.run/fal-ai/florence-2-large/ocr-with-region","tagline":"Florence-2 is an advanced vision foundation model that uses a prompt-based approach to handle a wide range of vision and vision-language 
tasks","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/florence-2-large/ocr","name":"Florence 2 Large OCR","created_by":"fal","source":"official","description":"Florence-2 is an advanced vision foundation model that uses a prompt-based approach to handle a wide range of vision and vision-language tasks","status":"active","release_date":"2024-06-22","model_type":"other","page_url":"https://fal.run/fal-ai/florence-2-large/ocr","tagline":"Florence-2 is an advanced vision foundation model that uses a prompt-based approach to handle a wide range of vision and vision-language tasks","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/florence-2-large/open-vocabulary-detection","name":"Florence-2 Large","created_by":"fal","source":"official","description":"Florence-2 is an advanced vision foundation model that uses a prompt-based approach to handle a wide range of vision and vision-language tasks","status":"active","release_date":"2024-06-22","model_type":"image","page_url":"https://fal.run/fal-ai/florence-2-large/open-vocabulary-detection","tagline":"Florence-2 is an advanced vision foundation model that uses a prompt-based approach to handle a wide range of vision and vision-language tasks","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/florence-2-large/referring-expression-segmentation","name":"Florence-2 Large","created_by":"fal","source":"official","description":"Florence-2 is an advanced vision foundation model that uses a prompt-based approach to handle a wide range of vision and vision-language 
tasks","status":"active","release_date":"2024-06-22","model_type":"image","page_url":"https://fal.run/fal-ai/florence-2-large/referring-expression-segmentation","tagline":"Florence-2 is an advanced vision foundation model that uses a prompt-based approach to handle a wide range of vision and vision-language tasks","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/florence-2-large/region-proposal","name":"Florence-2 Large","created_by":"fal","source":"official","description":"Florence-2 is an advanced vision foundation model that uses a prompt-based approach to handle a wide range of vision and vision-language tasks","status":"active","release_date":"2024-06-22","model_type":"image","page_url":"https://fal.run/fal-ai/florence-2-large/region-proposal","tagline":"Florence-2 is an advanced vision foundation model that uses a prompt-based approach to handle a wide range of vision and vision-language tasks","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/florence-2-large/region-to-category","name":"Florence 2 Large Region To Category","created_by":"fal","source":"official","description":"Florence-2 is an advanced vision foundation model that uses a prompt-based approach to handle a wide range of vision and vision-language tasks","status":"active","release_date":"2024-06-22","model_type":"other","page_url":"https://fal.run/fal-ai/florence-2-large/region-to-category","tagline":"Florence-2 is an advanced vision foundation model that uses a prompt-based approach to handle a wide range of vision and vision-language tasks","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/florence-2-large/region-to-description","name":"Florence-2 
Large","created_by":"fal","source":"official","description":"Florence-2 is an advanced vision foundation model that uses a prompt-based approach to handle a wide range of vision and vision-language tasks","status":"active","release_date":"2024-06-22","model_type":"other","page_url":"https://fal.run/fal-ai/florence-2-large/region-to-description","tagline":"Florence-2 is an advanced vision foundation model that uses a prompt-based approach to handle a wide range of vision and vision-language tasks","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/florence-2-large/region-to-segmentation","name":"Florence-2 Large","created_by":"fal","source":"official","description":"Florence-2 is an advanced vision foundation model that uses a prompt-based approach to handle a wide range of vision and vision-language tasks","status":"active","release_date":"2024-06-22","model_type":"image","page_url":"https://fal.run/fal-ai/florence-2-large/region-to-segmentation","tagline":"Florence-2 is an advanced vision foundation model that uses a prompt-based approach to handle a wide range of vision and vision-language tasks","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/flowedit","name":"Flow-Edit","created_by":"fal","source":"official","description":"The model provides you high quality image editing capabilities.","status":"active","release_date":"2025-02-14","model_type":"image","page_url":"https://fal.run/fal-ai/flowedit","tagline":"The model provides you high quality image editing capabilities.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/flux-1/dev/image-to-image","name":"FLUX.1 [dev]","created_by":"fal","source":"official","description":"FLUX.1 [dev] is a 12 
billion parameter flow transformer that generates high-quality images from text.","status":"active","release_date":"2025-06-02","model_type":"image","page_url":"https://fal.run/fal-ai/flux-1/dev/image-to-image","tagline":"FLUX.1 [dev] is a 12 billion parameter flow transformer that generates high-quality images from text.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/flux-1/dev/redux","name":"FLUX.1 [dev] Redux","created_by":"fal","source":"official","description":"FLUX.1 [dev] Redux is a high-performance endpoint for the FLUX.1 [dev] model that enables rapid transformation of existing images, delivering high-quality style transfers and image modifications with ","status":"active","release_date":"2025-06-02","model_type":"image","page_url":"https://fal.run/fal-ai/flux-1/dev/redux","tagline":"FLUX.1 [dev] Redux is a high-performance endpoint for the FLUX.1 [dev] model that enables rapid transformation of existing images, delivering high-quality style transfers and image modifications with ","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/flux-1/dev","name":"FLUX.1 [dev]","created_by":"fal","source":"official","description":"FLUX.1 [dev] is a 12 billion parameter flow transformer that generates high-quality images from text.","status":"active","release_date":"2025-06-02","model_type":"image","page_url":"https://fal.run/fal-ai/flux-1/dev","tagline":"FLUX.1 [dev] is a 12 billion parameter flow transformer that generates high-quality images from text.","capabilities":{"streaming":true,"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/flux-1/krea/image-to-image","name":"FLUX.1 Krea 
[dev]","created_by":"fal","source":"official","description":"FLUX.1 Krea [dev] is a 12 billion parameter flow transformer that generates high-quality images from text with incredible aesthetics.","status":"active","release_date":"2025-07-30","model_type":"image","page_url":"https://fal.run/fal-ai/flux-1/krea/image-to-image","tagline":"FLUX.1 Krea [dev] is a 12 billion parameter flow transformer that generates high-quality images from text with incredible aesthetics.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/flux-1/krea/redux","name":"FLUX.1 Krea [dev] Redux","created_by":"fal","source":"official","description":"FLUX.1 Krea [dev] Redux is a high-performance endpoint for the FLUX.1 Krea [dev] model that enables rapid transformation of existing images, delivering high-quality style transfers and image modificat","status":"active","release_date":"2025-07-30","model_type":"image","page_url":"https://fal.run/fal-ai/flux-1/krea/redux","tagline":"FLUX.1 Krea [dev] Redux is a high-performance endpoint for the FLUX.1 Krea [dev] model that enables rapid transformation of existing images, delivering high-quality style transfers and image modificat","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/flux-1/krea","name":"FLUX.1 Krea [dev]","created_by":"fal","source":"official","description":"FLUX.1 Krea [dev] is a 12 billion parameter flow transformer that generates high-quality images from text with incredible aesthetics.","status":"active","release_date":"2025-07-30","model_type":"image","page_url":"https://fal.run/fal-ai/flux-1/krea","tagline":"FLUX.1 Krea [dev] is a 12 billion parameter flow transformer that generates high-quality images from text with incredible 
aesthetics.","capabilities":{"streaming":true,"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/flux-1/schnell/redux","name":"FLUX.1 [schnell] Redux","created_by":"fal","source":"official","description":"FLUX.1 [schnell] Redux is a high-performance endpoint for the FLUX.1 [schnell] model that enables rapid transformation of existing images, delivering high-quality style transfers and image modifications with the core FLUX capabilities.","status":"active","release_date":"2025-06-02","model_type":"image","page_url":"https://fal.run/fal-ai/flux-1/schnell/redux","tagline":"FLUX.1 [schnell] Redux is a high-performance endpoint for the FLUX.1 [schnell] model that enables rapid transformation of existing images, delivering high-quality style transfers and image modificatio","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/flux-1/schnell","name":"FLUX.1 [schnell]","created_by":"fal","source":"official","description":"Fastest inference in the world for the 12 billion parameter FLUX.1 [schnell] text-to-image model.","status":"active","release_date":"2025-06-02","model_type":"image","page_url":"https://fal.run/fal-ai/flux-1/schnell","tagline":"Fastest inference in the world for the 12 billion parameter FLUX.1 [schnell] text-to-image model.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-05-19","last_updated":"2026-06-03"},{"id":"fal-ai/flux-1/srpo/image-to-image","name":"FLUX.1 SRPO [dev]","created_by":"fal","source":"official","description":"FLUX.1 SRPO [dev] is a 12 billion parameter flow transformer that generates high-quality images from text with incredible 
aesthetics.","status":"active","release_date":"2025-09-15","model_type":"image","page_url":"https://fal.run/fal-ai/flux-1/srpo/image-to-image","tagline":"FLUX.1 SRPO [dev] is a 12 billion parameter flow transformer that generates high-quality images from text with incredible aesthetics.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/flux-1/srpo","name":"FLUX.1 SRPO [dev]","created_by":"fal","source":"official","description":"FLUX.1 SRPO [dev] is a 12 billion parameter flow transformer that generates high-quality images from text with incredible aesthetics.","status":"active","release_date":"2025-09-15","model_type":"image","page_url":"https://fal.run/fal-ai/flux-1/srpo","tagline":"FLUX.1 SRPO [dev] is a 12 billion parameter flow transformer that generates high-quality images from text with incredible aesthetics.","capabilities":{"streaming":true,"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/flux-2/edit","name":"FLUX 2 Edit","created_by":"fal","source":"official","description":"Image-to-image editing with FLUX.2 [dev] from Black Forest Labs.","status":"active","release_date":"2025-11-23","model_type":"image","page_url":"https://fal.run/fal-ai/flux-2/edit","tagline":"Image-to-image editing with FLUX.2 [dev] from Black Forest Labs.","capabilities":{"streaming":true,"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/flux-2/flash/edit","name":"FLUX 2 Flash Edit","created_by":"fal","source":"official","description":"Image-to-image editing with FLUX.2 [dev] from Black Forest 
Labs.","status":"active","release_date":"2025-12-16","model_type":"image","page_url":"https://fal.run/fal-ai/flux-2/flash/edit","tagline":"Image-to-image editing with FLUX.2 [dev] from Black Forest Labs.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/flux-2/flash","name":"FLUX 2 Flash","created_by":"fal","source":"official","description":"Text-to-image generation with FLUX.2 [dev] from Black Forest Labs.","status":"active","release_date":"2025-12-16","model_type":"image","page_url":"https://fal.run/fal-ai/flux-2/flash","tagline":"Text-to-image generation with FLUX.2 [dev] from Black Forest Labs.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/flux-2-flex/edit","name":"Flux 2 Flex","created_by":"fal","source":"official","description":"Image editing with FLUX.2 [flex] from Black Forest Labs.","status":"active","release_date":"2025-11-25","model_type":"image","page_url":"https://fal.run/fal-ai/flux-2-flex/edit","tagline":"Image editing with FLUX.2 [flex] from Black Forest Labs.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/flux-2-flex","name":"Flux 2 Flex","created_by":"fal","source":"official","description":"Text-to-image generation with FLUX.2 [flex] from Black Forest Labs.","status":"active","release_date":"2025-11-25","model_type":"image","page_url":"https://fal.run/fal-ai/flux-2-flex","tagline":"Text-to-image generation with FLUX.2 [flex] from Black Forest 
Labs.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/flux-2/klein/4b/base/edit/lora","name":"FLUX.2 [klein] 4B Base LoRA","created_by":"fal","source":"official","description":"Image-to-image editing with LoRA support for FLUX.2 [klein] 4B Base from Black Forest Labs.","status":"active","release_date":"2026-01-19","model_type":"image","page_url":"https://fal.run/fal-ai/flux-2/klein/4b/base/edit/lora","tagline":"Image-to-image editing with LoRA support for FLUX.2 [klein] 4B Base from Black Forest Labs.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-03-17","last_updated":"2026-05-11"},{"id":"fal-ai/flux-2/klein/4b/base/edit","name":"FLUX.2 [klein] 4B Base","created_by":"fal","source":"official","description":"Image-to-image editing with FLUX.2 [klein] 4B Base from Black Forest Labs.","status":"active","release_date":"2026-01-15","model_type":"image","page_url":"https://fal.run/fal-ai/flux-2/klein/4b/base/edit","tagline":"Image-to-image editing with FLUX.2 [klein] 4B Base from Black Forest Labs.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-03-17","last_updated":"2026-05-11"},{"id":"fal-ai/flux-2/klein/4b/base/lora","name":"FLUX.2 [klein] 4B Base LoRA","created_by":"fal","source":"official","description":"Text-to-image generation with LoRA support for FLUX.2 [klein] 4B Base from Black Forest Labs.","status":"active","release_date":"2026-01-19","model_type":"image","page_url":"https://fal.run/fal-ai/flux-2/klein/4b/base/lora","tagline":"Text-to-image generation with LoRA support for FLUX.2 [klein] 4B Base from Black Forest 
Labs.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-03-17","last_updated":"2026-05-11"},{"id":"fal-ai/flux-2-klein-4b-base-trainer/edit","name":"Flux 2 Klein 4B Base Trainer","created_by":"fal","source":"official","description":"Fine-tune FLUX.2 [klein] 4B from Black Forest Labs with custom datasets.","status":"active","release_date":"2026-01-16","model_type":"other","parameters":4,"page_url":"https://fal.run/fal-ai/flux-2-klein-4b-base-trainer/edit","tagline":"Fine-tune FLUX.2 [klein] 4B from Black Forest Labs with custom datasets.","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/flux-2-klein-4b-base-trainer","name":"Flux 2 Klein 4B Base Trainer","created_by":"fal","source":"official","description":"Fine-tune FLUX.2 [klein] 4B from Black Forest Labs with custom datasets.","status":"active","release_date":"2026-01-17","model_type":"other","parameters":4,"page_url":"https://fal.run/fal-ai/flux-2-klein-4b-base-trainer","tagline":"Fine-tune FLUX.2 [klein] 4B from Black Forest Labs with custom datasets.","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/flux-2/klein/4b/base","name":"FLUX.2 [klein] 4B Base","created_by":"fal","source":"official","description":"Text-to-image generation with FLUX.2 [klein] 4B Base from Black Forest Labs.","status":"active","release_date":"2026-01-15","model_type":"image","page_url":"https://fal.run/fal-ai/flux-2/klein/4b/base","tagline":"Text-to-image generation with FLUX.2 [klein] 4B Base from Black Forest Labs.","capabilities":{"streaming":true,"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-03-17","last_updated":"2026-05-11"},{"id":"fal-ai/flux-2/klein/4b/edit/lora","name":"FLUX.2 [klein] 4B LoRA","created_by":"fal","source":"official","description":"Image-to-image editing with FLUX.2 [klein] 4B from Black Forest Labs and custom 
LoRA.","status":"active","release_date":"2026-03-17","model_type":"image","page_url":"https://fal.run/fal-ai/flux-2/klein/4b/edit/lora","tagline":"Image-to-image editing with FLUX.2 [klein] 4B from Black Forest Labs and custom LoRA.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-03-17","last_updated":"2026-05-11"},{"id":"fal-ai/flux-2/klein/4b/edit","name":"FLUX.2 [klein] 4B","created_by":"fal","source":"official","description":"Image-to-image editing with FLUX.2 [klein] 4B from Black Forest Labs.","status":"active","release_date":"2026-01-15","model_type":"image","page_url":"https://fal.run/fal-ai/flux-2/klein/4b/edit","tagline":"Image-to-image editing with FLUX.2 [klein] 4B from Black Forest Labs.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-03-17","last_updated":"2026-05-11"},{"id":"fal-ai/flux-2/klein/4b/lora","name":"FLUX.2 [klein] 4B LoRA","created_by":"fal","source":"official","description":"Text-to-image generation with FLUX.2 [klein] 4B from Black Forest Labs and custom LoRA.","status":"active","release_date":"2026-03-17","model_type":"image","page_url":"https://fal.run/fal-ai/flux-2/klein/4b/lora","tagline":"Text-to-image generation with FLUX.2 [klein] 4B from Black Forest Labs and custom LoRA.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-03-17","last_updated":"2026-05-11"},{"id":"fal-ai/flux-2/klein/4b","name":"FLUX.2 [klein] 4B","created_by":"fal","source":"official","description":"Text-to-image generation with FLUX.2 [klein] 4B from Black Forest Labs.","status":"active","release_date":"2026-01-15","model_type":"image","page_url":"https://fal.run/fal-ai/flux-2/klein/4b","tagline":"Text-to-image generation with FLUX.2 [klein] 4B from Black Forest 
Labs.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-03-17","last_updated":"2026-05-11"},{"id":"fal-ai/flux-2/klein/9b/base/edit/lora","name":"FLUX.2 [klein] 9B Base LoRA","created_by":"fal","source":"official","description":"Image-to-image editing with LoRA support for FLUX.2 [klein] 9B Base from Black Forest Labs.","status":"active","release_date":"2026-01-19","model_type":"image","page_url":"https://fal.run/fal-ai/flux-2/klein/9b/base/edit/lora","tagline":"Image-to-image editing with LoRA support for FLUX.2 [klein] 9B Base from Black Forest Labs.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-03-17","last_updated":"2026-05-11"},{"id":"fal-ai/flux-2/klein/9b/base/edit","name":"FLUX.2 [klein] 9B Base","created_by":"fal","source":"official","description":"Image-to-image editing with Flux 2 [klein] 9B Base from Black Forest Labs.","status":"active","release_date":"2026-01-15","model_type":"image","page_url":"https://fal.run/fal-ai/flux-2/klein/9b/base/edit","tagline":"Image-to-image editing with Flux 2 [klein] 9B Base from Black Forest Labs.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-03-17","last_updated":"2026-05-11"},{"id":"fal-ai/flux-2/klein/9b/base/lora","name":"FLUX.2 [klein] 9B Base LoRA","created_by":"fal","source":"official","description":"Text-to-image generation with LoRA support for FLUX.2 [klein] 9B Base from Black Forest Labs.","status":"active","release_date":"2026-01-19","model_type":"image","page_url":"https://fal.run/fal-ai/flux-2/klein/9b/base/lora","tagline":"Text-to-image generation with LoRA support for FLUX.2 [klein] 9B Base from Black Forest 
Labs.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-03-17","last_updated":"2026-05-11"},{"id":"fal-ai/flux-2-klein-9b-base-trainer/edit","name":"Flux 2 Klein 9B Base Trainer","created_by":"fal","source":"official","description":"Fine-tune FLUX.2 [klein] 9B from Black Forest Labs with custom datasets.","status":"active","release_date":"2026-01-17","model_type":"other","parameters":9,"page_url":"https://fal.run/fal-ai/flux-2-klein-9b-base-trainer/edit","tagline":"Fine-tune FLUX.2 [klein] 9B from Black Forest Labs with custom datasets.","last_seen_at":"2026-06-19","last_updated":"2026-06-20"},{"id":"fal-ai/flux-2-klein-9b-base-trainer","name":"FLUX 2 [klein] 9b Base Trainer","created_by":"fal","source":"official","description":"Fine-tune FLUX.2 [klein] 9B from Black Forest Labs with custom datasets.","status":"active","release_date":"2026-01-17","model_type":"other","parameters":9,"page_url":"https://fal.run/fal-ai/flux-2-klein-9b-base-trainer","tagline":"Fine-tune FLUX.2 [klein] 9B from Black Forest Labs with custom datasets.","last_seen_at":"2026-06-19","last_updated":"2026-06-20"},{"id":"fal-ai/flux-2/klein/9b/base","name":"FLUX.2 [klein] 9B Base","created_by":"fal","source":"official","description":"Text-to-image generation with FLUX.2 [klein] 9B Base from Black Forest Labs.","status":"active","release_date":"2026-01-15","model_type":"image","page_url":"https://fal.run/fal-ai/flux-2/klein/9b/base","tagline":"Text-to-image generation with FLUX.2 [klein] 9B Base from Black Forest Labs.","capabilities":{"streaming":true,"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/flux-2/klein/9b/edit/lora","name":"FLUX.2 [klein] 9B LoRA","created_by":"fal","source":"official","description":"Image-to-image editing with FLUX.2 [klein] 9B from Black Forest Labs and custom 
LoRA.","status":"active","release_date":"2026-03-17","model_type":"image","page_url":"https://fal.run/fal-ai/flux-2/klein/9b/edit/lora","tagline":"Image-to-image editing with FLUX.2 [klein] 9B from Black Forest Labs and custom LoRA.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-03-20","last_updated":"2026-05-11"},{"id":"fal-ai/flux-2/klein/9b/edit","name":"FLUX.2 [klein] 9B","created_by":"fal","source":"official","description":"Image-to-image editing with FLUX.2 [klein] 9B from Black Forest Labs.","status":"active","release_date":"2026-01-15","model_type":"image","page_url":"https://fal.run/fal-ai/flux-2/klein/9b/edit","tagline":"Image-to-image editing with FLUX.2 [klein] 9B from Black Forest Labs.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-03-17","last_updated":"2026-05-11"},{"id":"fal-ai/flux-2/klein/9b/lora","name":"FLUX.2 [klein] 9B LoRA","created_by":"fal","source":"official","description":"Text-to-image generation with FLUX.2 [klein] 9B from Black Forest Labs and custom LoRA.","status":"active","release_date":"2026-03-17","model_type":"image","page_url":"https://fal.run/fal-ai/flux-2/klein/9b/lora","tagline":"Text-to-image generation with FLUX.2 [klein] 9B from Black Forest Labs and custom LoRA.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-03-20","last_updated":"2026-05-11"},{"id":"fal-ai/flux-2/klein/9b","name":"FLUX.2 [klein] 9B","created_by":"fal","source":"official","description":"Text-to-image generation with FLUX.2 [klein] 9B from Black Forest Labs.","status":"active","release_date":"2026-01-15","model_type":"image","page_url":"https://fal.run/fal-ai/flux-2/klein/9b","tagline":"Text-to-image generation with FLUX.2 [klein] 9B from Black Forest 
Labs.","capabilities":{"streaming":true,"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-30","last_updated":"2026-06-30"},{"id":"fal-ai/flux-2/klein/realtime","name":"Flux 2 [klein] Realtime","created_by":"fal","source":"official","description":"Realtime generation with FLUX.2 [klein] from Black Forest Labs.","status":"active","release_date":"2026-02-05","model_type":"image","page_url":"https://fal.run/fal-ai/flux-2/klein/realtime","tagline":"Realtime generation with FLUX.2 [klein] from Black Forest Labs.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-02-09","last_updated":"2026-05-11"},{"id":"fal-ai/flux-2/lora/edit","name":"FLUX 2 Lora Edit","created_by":"fal","source":"official","description":"Image-to-image editing with LoRA support for FLUX.2 [dev] from Black Forest Labs.","status":"active","release_date":"2025-11-23","model_type":"image","page_url":"https://fal.run/fal-ai/flux-2/lora/edit","tagline":"Image-to-image editing with LoRA support for FLUX.2 [dev] from Black Forest Labs.","capabilities":{"streaming":true,"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/flux-2-lora-gallery/add-background","name":"Flux 2 Lora Gallery","created_by":"fal","source":"official","description":"Add a background to images with white/clean background","status":"active","release_date":"2025-11-25","model_type":"image","page_url":"https://fal.run/fal-ai/flux-2-lora-gallery/add-background","tagline":"Add a background to images with white/clean background","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/flux-2-lora-gallery/apartment-staging","name":"Flux 2 Lora 
Gallery","created_by":"fal","source":"official","description":"Virtually furnishes an empty apartment","status":"active","release_date":"2025-11-25","model_type":"image","page_url":"https://fal.run/fal-ai/flux-2-lora-gallery/apartment-staging","tagline":"Virtually furnishes an empty apartment","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/flux-2-lora-gallery/ballpoint-pen-sketch","name":"Flux 2 Lora Gallery","created_by":"fal","source":"official","description":"Ballpoint pen sketch drawing style","status":"active","release_date":"2025-11-25","model_type":"image","page_url":"https://fal.run/fal-ai/flux-2-lora-gallery/ballpoint-pen-sketch","tagline":"Ballpoint pen sketch drawing style","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/flux-2-lora-gallery/digital-comic-art","name":"Flux 2 Lora Gallery","created_by":"fal","source":"official","description":"Transforms images into comic book style","status":"active","release_date":"2025-11-25","model_type":"image","page_url":"https://fal.run/fal-ai/flux-2-lora-gallery/digital-comic-art","tagline":"Transforms images into comic book style","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/flux-2-lora-gallery/face-to-full-portrait","name":"Flux 2 Lora Gallery","created_by":"fal","source":"official","description":"Extends a face into a full body portrait","status":"active","release_date":"2025-11-25","model_type":"image","page_url":"https://fal.run/fal-ai/flux-2-lora-gallery/face-to-full-portrait","tagline":"Extends a face into a full body 
portrait","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/flux-2-lora-gallery/hdr-style","name":"FLUX 2 Lora Gallery Hdr Style","created_by":"fal","source":"official","description":"HDR surrealistic effect with intense colors","status":"active","release_date":"2025-11-25","model_type":"image","page_url":"https://fal.run/fal-ai/flux-2-lora-gallery/hdr-style","tagline":"HDR surrealistic effect with intense colors","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/flux-2-lora-gallery/multiple-angles","name":"Flux 2 Lora Gallery","created_by":"fal","source":"official","description":"Generates same object from different angles (azimuth/elevation)","status":"active","release_date":"2025-11-25","model_type":"image","page_url":"https://fal.run/fal-ai/flux-2-lora-gallery/multiple-angles","tagline":"Generates same object from different angles (azimuth/elevation)","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/flux-2-lora-gallery/realism","name":"FLUX 2 Lora Gallery Realism","created_by":"fal","source":"official","description":"Makes images more photorealistic and natural","status":"active","release_date":"2025-11-25","model_type":"image","page_url":"https://fal.run/fal-ai/flux-2-lora-gallery/realism","tagline":"Makes images more photorealistic and natural","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/flux-2-lora-gallery/satellite-view-style","name":"Flux 2 Lora Gallery","created_by":"fal","source":"official","description":"Generates satellite/aerial view 
style images","status":"active","release_date":"2025-11-25","model_type":"image","page_url":"https://fal.run/fal-ai/flux-2-lora-gallery/satellite-view-style","tagline":"Generates satellite/aerial view style images","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/flux-2-lora-gallery/sepia-vintage","name":"Flux 2 Lora Gallery","created_by":"fal","source":"official","description":"Applies sepia vintage effect to images","status":"active","release_date":"2025-11-25","model_type":"image","page_url":"https://fal.run/fal-ai/flux-2-lora-gallery/sepia-vintage","tagline":"Applies sepia vintage effect to images","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/flux-2-lora-gallery/virtual-tryon","name":"Flux 2 Lora Gallery","created_by":"fal","source":"official","description":"Virtual clothing try-on (2 images: person + garment)","status":"active","release_date":"2025-11-25","model_type":"image","page_url":"https://fal.run/fal-ai/flux-2-lora-gallery/virtual-tryon","tagline":"Virtual clothing try-on (2 images: person + garment)","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/flux-2/lora","name":"FLUX 2 Lora","created_by":"fal","source":"official","description":"Text-to-image generation with LoRA support for FLUX.2 [dev] from Black Forest Labs.","status":"active","release_date":"2025-11-23","model_type":"image","page_url":"https://fal.run/fal-ai/flux-2/lora","tagline":"Text-to-image generation with LoRA support for FLUX.2 [dev] from Black Forest 
Labs.","capabilities":{"streaming":true,"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/flux-2-max/edit","name":"Flux 2 Max","created_by":"fal","source":"official","description":"FLUX.2 [max] delivers state-of-the-art image generation and advanced image editing with exceptional realism, precision, and consistency.","status":"active","release_date":"2025-12-16","model_type":"image","page_url":"https://fal.run/fal-ai/flux-2-max/edit","tagline":"FLUX.2 [max] delivers state-of-the-art image generation and advanced image editing with exceptional realism, precision, and consistency.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-24","last_updated":"2026-05-11"},{"id":"fal-ai/flux-2-max","name":"Flux 2 Max","created_by":"fal","source":"official","description":"FLUX.2 [max] delivers state-of-the-art image generation and advanced image editing with exceptional realism, precision, and consistency.","status":"active","release_date":"2025-12-16","model_type":"image","page_url":"https://fal.run/fal-ai/flux-2-max","tagline":"FLUX.2 [max] delivers state-of-the-art image generation and advanced image editing with exceptional realism, precision, and consistency.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/flux-2-pro/edit","name":"FLUX 2 Pro Edit","created_by":"fal","source":"official","description":"Text-to-image generation with FLUX.2 [pro] from Black Forest Labs.","status":"active","release_date":"2025-11-23","model_type":"image","page_url":"https://fal.run/fal-ai/flux-2-pro/edit","tagline":"Text-to-image generation with FLUX.2 [pro] from Black Forest 
Labs.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/flux-2-pro/outpaint","name":"FLUX 2 Pro Outpaint","created_by":"fal","source":"official","description":"Outpainting generation with FLUX.2 [pro] from Black Forest Labs.","status":"active","release_date":"2026-05-14","model_type":"image","page_url":"https://fal.run/fal-ai/flux-2-pro/outpaint","tagline":"Outpainting generation with FLUX.2 [pro] from Black Forest Labs.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/flux-2-pro","name":"Flux 2 Pro","created_by":"fal","source":"official","description":"Image editing with FLUX.2 [pro] from Black Forest Labs.","status":"active","release_date":"2025-11-23","model_type":"image","page_url":"https://fal.run/fal-ai/flux-2-pro","tagline":"Image editing with FLUX.2 [pro] from Black Forest Labs.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/flux-2-trainer/edit","name":"FLUX 2 Trainer Edit","created_by":"fal","source":"official","description":"Fine-tune FLUX.2 [dev] from Black Forest Labs with custom datasets.","status":"active","release_date":"2025-11-25","model_type":"other","page_url":"https://fal.run/fal-ai/flux-2-trainer/edit","tagline":"Fine-tune FLUX.2 [dev] from Black Forest Labs with custom datasets.","last_seen_at":"2026-06-19","last_updated":"2026-06-20"},{"id":"fal-ai/flux-2-trainer-v2/edit","name":"FLUX 2 Trainer V2 Edit","created_by":"fal","source":"official","description":"Fine-tune FLUX.2 [dev] from Black Forest Labs with custom 
datasets.","status":"active","release_date":"2026-01-10","model_type":"other","page_url":"https://fal.run/fal-ai/flux-2-trainer-v2/edit","tagline":"Fine-tune FLUX.2 [dev] from Black Forest Labs with custom datasets.","last_seen_at":"2026-06-19","last_updated":"2026-06-20"},{"id":"fal-ai/flux-2-trainer-v2","name":"FLUX 2 Trainer V2","created_by":"fal","source":"official","description":"Fine-tune FLUX.2 [dev] from Black Forest Labs with custom datasets.","status":"active","release_date":"2026-01-10","model_type":"other","page_url":"https://fal.run/fal-ai/flux-2-trainer-v2","tagline":"Fine-tune FLUX.2 [dev] from Black Forest Labs with custom datasets.","last_seen_at":"2026-06-19","last_updated":"2026-06-20"},{"id":"fal-ai/flux-2-trainer","name":"FLUX 2 Trainer","created_by":"fal","source":"official","description":"Fine-tune FLUX.2 [dev] from Black Forest Labs with custom datasets.","status":"active","release_date":"2025-11-25","model_type":"other","page_url":"https://fal.run/fal-ai/flux-2-trainer","tagline":"Fine-tune FLUX.2 [dev] from Black Forest Labs with custom datasets.","last_seen_at":"2026-06-19","last_updated":"2026-06-20"},{"id":"fal-ai/flux-2/turbo/edit","name":"FLUX 2 Turbo Edit","created_by":"fal","source":"official","description":"Image-to-image editing with FLUX.2 [dev] from Black Forest Labs.","status":"active","release_date":"2025-12-16","model_type":"image","page_url":"https://fal.run/fal-ai/flux-2/turbo/edit","tagline":"Image-to-image editing with FLUX.2 [dev] from Black Forest Labs.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/flux-2/turbo","name":"FLUX 2 Turbo","created_by":"fal","source":"official","description":"Text-to-image generation with FLUX.2 [dev] from Black Forest 
Labs.","status":"active","release_date":"2025-12-16","model_type":"image","page_url":"https://fal.run/fal-ai/flux-2/turbo","tagline":"Text-to-image generation with FLUX.2 [dev] from Black Forest Labs.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/flux-2","name":"FLUX 2","created_by":"fal","source":"official","description":"Text-to-image generation with FLUX.2 [dev] from Black Forest Labs.","status":"active","release_date":"2025-11-23","model_type":"image","page_url":"https://fal.run/fal-ai/flux-2","tagline":"Text-to-image generation with FLUX.2 [dev] from Black Forest Labs.","capabilities":{"streaming":true,"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-05-27","last_updated":"2026-06-03"},{"id":"fal-ai/flux-control-lora-canny/image-to-image","name":"FLUX.1 [dev] Control LoRA Canny","created_by":"fal","source":"official","description":"FLUX Control LoRA Canny is a high-performance endpoint that uses a control image using a Canny edge map to transfer structure to the generated image and another initial image to guide color.","status":"active","release_date":"2025-02-11","model_type":"image","page_url":"https://fal.run/fal-ai/flux-control-lora-canny/image-to-image","tagline":"FLUX Control LoRA Canny is a high-performance endpoint that uses a control image using a Canny edge map to transfer structure to the generated image and another initial image to guide color.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/flux-control-lora-canny","name":"FLUX.1 [dev] Control LoRA Canny","created_by":"fal","source":"official","description":"FLUX Control LoRA Canny is a high-performance endpoint that uses a control image to transfer structure to the 
generated image, using a Canny edge map.","status":"active","release_date":"2025-02-11","model_type":"image","page_url":"https://fal.run/fal-ai/flux-control-lora-canny","tagline":"FLUX Control LoRA Canny is a high-performance endpoint that uses a control image to transfer structure to the generated image, using a Canny edge map.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/flux-control-lora-depth/image-to-image","name":"FLUX.1 [dev] Control LoRA Depth","created_by":"fal","source":"official","description":"FLUX Control LoRA Depth is a high-performance endpoint that uses a control image using a depth map to transfer structure to the generated image and another initial image to guide color.","status":"active","release_date":"2025-02-11","model_type":"image","page_url":"https://fal.run/fal-ai/flux-control-lora-depth/image-to-image","tagline":"FLUX Control LoRA Depth is a high-performance endpoint that uses a control image using a depth map to transfer structure to the generated image and another initial image to guide color.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/flux-control-lora-depth","name":"FLUX.1 [dev] Control LoRA Depth","created_by":"fal","source":"official","description":"FLUX Control LoRA Depth is a high-performance endpoint that uses a control image to transfer structure to the generated image, using a depth map.","status":"active","release_date":"2025-02-11","model_type":"image","page_url":"https://fal.run/fal-ai/flux-control-lora-depth","tagline":"FLUX Control LoRA Depth is a high-performance endpoint that uses a control image to transfer structure to the generated image, using a depth 
map.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/flux/dev/image-to-image","name":"FLUX.1 [dev]","created_by":"fal","source":"official","description":"FLUX.1 Image-to-Image is a high-performance endpoint for the FLUX.1 [dev] model that enables rapid transformation of existing images, delivering high-quality style transfers and image modifications wi","status":"active","release_date":"2024-07-11","model_type":"image","page_url":"https://fal.run/fal-ai/flux/dev/image-to-image","tagline":"FLUX.1 Image-to-Image is a high-performance endpoint for the FLUX.1 [dev] model that enables rapid transformation of existing images, delivering high-quality style transfers and image modifications wi","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/flux/dev/redux","name":"FLUX.1 [dev] Redux","created_by":"fal","source":"official","description":"FLUX.1 [dev] Redux is a high-performance endpoint for the FLUX.1 [dev] model that enables rapid transformation of existing images, delivering high-quality style transfers and image modifications with ","status":"active","release_date":"2024-11-21","model_type":"image","page_url":"https://fal.run/fal-ai/flux/dev/redux","tagline":"FLUX.1 [dev] Redux is a high-performance endpoint for the FLUX.1 [dev] model that enables rapid transformation of existing images, delivering high-quality style transfers and image modifications with ","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/flux/dev","name":"FLUX.1 [dev]","created_by":"fal","source":"official","description":"FLUX.1 [dev] is a 12 billion parameter flow transformer that generates high-quality 
images from text.","status":"active","release_date":"2025-04-01","model_type":"image","page_url":"https://fal.run/fal-ai/flux/dev","tagline":"FLUX.1 [dev] is a 12 billion parameter flow transformer that generates high-quality images from text.","capabilities":{"streaming":true,"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/flux-differential-diffusion","name":"FLUX.1 [dev] Differential Diffusion","created_by":"fal","source":"official","description":"FLUX.1 Differential Diffusion is a rapid endpoint that enables swift, granular control over image transformations through change maps, delivering fast and precise region-specific modifications while m","status":"active","release_date":"2024-11-06","model_type":"image","page_url":"https://fal.run/fal-ai/flux-differential-diffusion","tagline":"FLUX.1 Differential Diffusion is a rapid endpoint that enables swift, granular control over image transformations through change maps, delivering fast and precise region-specific modifications while m","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/flux-general/differential-diffusion","name":"FLUX.1 [dev] with Controlnets and Loras","created_by":"fal","source":"official","description":"A specialized FLUX endpoint combining differential diffusion control with LoRA, ControlNet, and IP-Adapter support, enabling precise, region-specific image transformations through customizable change ","status":"active","release_date":"2024-08-13","model_type":"image","page_url":"https://fal.run/fal-ai/flux-general/differential-diffusion","tagline":"A specialized FLUX endpoint combining differential diffusion control with LoRA, ControlNet, and IP-Adapter support, enabling precise, region-specific image transformations through customizable change 
","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/flux-general/image-to-image","name":"FLUX.1 [dev] with Controlnets and Loras","created_by":"fal","source":"official","description":"FLUX General Image-to-Image is a versatile endpoint that transforms existing images with support for LoRA, ControlNet, and IP-Adapter extensions, enabling precise control over style transfer, modifica","status":"active","release_date":"2024-08-14","model_type":"image","page_url":"https://fal.run/fal-ai/flux-general/image-to-image","tagline":"FLUX General Image-to-Image is a versatile endpoint that transforms existing images with support for LoRA, ControlNet, and IP-Adapter extensions, enabling precise control over style transfer, modifica","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/flux-general/inpainting","name":"FLUX.1 [dev] with Controlnets and Loras","created_by":"fal","source":"official","description":"FLUX General Inpainting is a versatile endpoint that enables precise image editing and completion, supporting multiple AI extensions including LoRA, ControlNet, and IP-Adapter for enhanced control ove","status":"active","release_date":"2024-08-14","model_type":"image","page_url":"https://fal.run/fal-ai/flux-general/inpainting","tagline":"FLUX General Inpainting is a versatile endpoint that enables precise image editing and completion, supporting multiple AI extensions including LoRA, ControlNet, and IP-Adapter for enhanced control ove","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/flux-general/rf-inversion","name":"FLUX.1 [dev] with Controlnets and 
Loras","created_by":"fal","source":"official","description":"A general purpose endpoint for the FLUX.1 [dev] model, implementing the RF-Inversion pipeline.","status":"active","release_date":"2024-09-17","model_type":"image","page_url":"https://fal.run/fal-ai/flux-general/rf-inversion","tagline":"A general purpose endpoint for the FLUX.1 [dev] model, implementing the RF-Inversion pipeline.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/flux-general","name":"FLUX.1 [dev] with Controlnets and Loras","created_by":"fal","source":"official","description":"A versatile endpoint for the FLUX.1 [dev] model that supports multiple AI extensions including LoRA, ControlNet conditioning, and IP-Adapter integration, enabling comprehensive control over image gene","status":"active","release_date":"2024-08-21","model_type":"image","page_url":"https://fal.run/fal-ai/flux-general","tagline":"A versatile endpoint for the FLUX.1 [dev] model that supports multiple AI extensions including LoRA, ControlNet conditioning, and IP-Adapter integration, enabling comprehensive control over image gene","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/flux-kontext/dev","name":"FLUX.1 Kontext [dev]","created_by":"fal","source":"official","description":"Frontier image editing model.","status":"active","release_date":"2025-05-28","model_type":"image","page_url":"https://fal.run/fal-ai/flux-kontext/dev","tagline":"Frontier image editing model.","capabilities":{"streaming":true,"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/flux-kontext-lora/inpaint","name":"Flux Kontext 
Lora","created_by":"fal","source":"official","description":"Fast inpainting endpoint for the FLUX.1 Kontext [dev] model with LoRA support, enabling rapid and high-quality image inpainting with reference images, while using pre-trained LoRA adaptations for spec","status":"active","release_date":"2025-07-29","model_type":"image","page_url":"https://fal.run/fal-ai/flux-kontext-lora/inpaint","tagline":"Fast inpainting endpoint for the FLUX.1 Kontext [dev] model with LoRA support, enabling rapid and high-quality image inpainting with reference images, while using pre-trained LoRA adaptations for spec","capabilities":{"streaming":true,"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/flux-kontext-lora/text-to-image","name":"Flux Kontext Lora","created_by":"fal","source":"official","description":"Super fast text-to-image endpoint for the FLUX.1 Kontext [dev] model with LoRA support, enabling rapid and high-quality image generation using pre-trained LoRA adaptations for personalization, specifi","status":"active","release_date":"2025-06-25","model_type":"image","page_url":"https://fal.run/fal-ai/flux-kontext-lora/text-to-image","tagline":"Super fast text-to-image endpoint for the FLUX.1 Kontext [dev] model with LoRA support, enabling rapid and high-quality image generation using pre-trained LoRA adaptations for personalization, specifi","capabilities":{"streaming":true,"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/flux-kontext-lora","name":"Flux Kontext Lora","created_by":"fal","source":"official","description":"Fast endpoint for the FLUX.1 Kontext [dev] model with LoRA support, enabling rapid and high-quality image editing using pre-trained LoRA adaptations for specific styles, brand identities, and 
product-","status":"active","release_date":"2025-06-25","model_type":"image","page_url":"https://fal.run/fal-ai/flux-kontext-lora","tagline":"Fast endpoint for the FLUX.1 Kontext [dev] model with LoRA support, enabling rapid and high-quality image editing using pre-trained LoRA adaptations for specific styles, brand identities, and product-","capabilities":{"streaming":true,"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/flux-kontext-trainer","name":"Flux Kontext Trainer","created_by":"fal","source":"official","description":"LoRA trainer for FLUX.1 Kontext [dev]","status":"active","release_date":"2025-06-26","model_type":"other","page_url":"https://fal.run/fal-ai/flux-kontext-trainer","tagline":"LoRA trainer for FLUX.1 Kontext [dev]","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/flux/krea/image-to-image","name":"FLUX.1 Krea [dev]","created_by":"fal","source":"official","description":"FLUX.1 Krea [dev] is a 12 billion parameter flow transformer that generates high-quality images from text with incredible aesthetics.","status":"active","release_date":"2025-07-30","model_type":"image","page_url":"https://fal.run/fal-ai/flux/krea/image-to-image","tagline":"FLUX.1 Krea [dev] is a 12 billion parameter flow transformer that generates high-quality images from text with incredible aesthetics.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/flux-krea-lora/image-to-image","name":"FLUX.1 Krea [dev] with LoRAs","created_by":"fal","source":"official","description":"FLUX LoRA Image-to-Image is a high-performance endpoint that transforms existing images using FLUX models, leveraging LoRA adaptations to enable rapid and precise image style transfer, modifications, 
","status":"active","release_date":"2025-08-01","model_type":"image","page_url":"https://fal.run/fal-ai/flux-krea-lora/image-to-image","tagline":"FLUX LoRA Image-to-Image is a high-performance endpoint that transforms existing images using FLUX models, leveraging LoRA adaptations to enable rapid and precise image style transfer, modifications, ","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/flux-krea-lora/inpainting","name":"FLUX.1 Krea [dev] Inpainting with LoRAs","created_by":"fal","source":"official","description":"Super fast endpoint for the FLUX.1 [dev] inpainting model with LoRA support, enabling rapid and high-quality image inpaingting using pre-trained LoRA adaptations for personalization, specific styles, ","status":"active","release_date":"2025-08-01","model_type":"image","page_url":"https://fal.run/fal-ai/flux-krea-lora/inpainting","tagline":"Super fast endpoint for the FLUX.1 [dev] inpainting model with LoRA support, enabling rapid and high-quality image inpaingting using pre-trained LoRA adaptations for personalization, specific styles, ","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/flux-krea-lora/stream","name":"Flux Krea Lora","created_by":"fal","source":"official","description":"Super fast endpoint for the FLUX.1 [dev] model with LoRA support, enabling rapid and high-quality image generation using pre-trained LoRA adaptations for personalization, specific styles, brand identi","status":"active","release_date":"2025-08-01","model_type":"image","page_url":"https://fal.run/fal-ai/flux-krea-lora/stream","tagline":"Super fast endpoint for the FLUX.1 [dev] model with LoRA support, enabling rapid and high-quality image generation using pre-trained LoRA adaptations for personalization, 
specific styles, brand identi","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/flux-krea-lora","name":"FLUX.1 Krea [dev] with LoRAs","created_by":"fal","source":"official","description":"Super fast endpoint for the FLUX.1 [dev] model with LoRA support, enabling rapid and high-quality image generation using pre-trained LoRA adaptations for personalization, specific styles, brand identi","status":"active","release_date":"2025-08-01","model_type":"image","page_url":"https://fal.run/fal-ai/flux-krea-lora","tagline":"Super fast endpoint for the FLUX.1 [dev] model with LoRA support, enabling rapid and high-quality image generation using pre-trained LoRA adaptations for personalization, specific styles, brand identi","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/flux/krea/redux","name":"FLUX.1 Krea [dev] Redux","created_by":"fal","source":"official","description":"FLUX.1 Krea [dev] Redux is a high-performance endpoint for the FLUX.1 Krea [dev] model that enables rapid transformation of existing images, delivering high-quality style transfers and image modificat","status":"active","release_date":"2025-07-30","model_type":"image","page_url":"https://fal.run/fal-ai/flux/krea/redux","tagline":"FLUX.1 Krea [dev] Redux is a high-performance endpoint for the FLUX.1 Krea [dev] model that enables rapid transformation of existing images, delivering high-quality style transfers and image modificat","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/flux-krea-trainer","name":"Train Flux Krea LoRA","created_by":"fal","source":"official","description":"Train styles, people and other subjects at blazing 
speeds using the FLUX.1 Krea [dev] base model.","status":"active","release_date":"2025-08-01","model_type":"other","page_url":"https://fal.run/fal-ai/flux-krea-trainer","tagline":"Train styles, people and other subjects at blazing speeds using the FLUX.1 Krea [dev] base model.","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/flux/krea","name":"FLUX.1 Krea [dev]","created_by":"fal","source":"official","description":"FLUX.1 Krea [dev] is a 12 billion parameter flow transformer that generates high-quality images from text with incredible aesthetics.","status":"active","release_date":"2025-07-30","model_type":"image","page_url":"https://fal.run/fal-ai/flux/krea","tagline":"FLUX.1 Krea [dev] is a 12 billion parameter flow transformer that generates high-quality images from text with incredible aesthetics.","capabilities":{"streaming":true,"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/flux-lora-canny","name":"FLUX.1 [dev] Canny with LoRAs","created_by":"fal","source":"official","description":"Utilize Flux.1 [dev] Controlnet to generate high-quality images with precise control over composition, style, and structure through advanced edge detection and guidance mechanisms.","status":"active","release_date":"2025-01-16","model_type":"image","page_url":"https://fal.run/fal-ai/flux-lora-canny","tagline":"Utilize Flux.1 [dev] Controlnet to generate high-quality images with precise control over composition, style, and structure through advanced edge detection and guidance mechanisms.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/flux-lora-depth","name":"FLUX.1 [dev] Depth with LoRAs","created_by":"fal","source":"official","description":"Generate high-quality images from depth maps using Flux.1 [dev] depth 
estimation model.","status":"active","release_date":"2024-11-21","model_type":"image","page_url":"https://fal.run/fal-ai/flux-lora-depth","tagline":"Generate high-quality images from depth maps using Flux.1 [dev] depth estimation model.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/flux-lora-fast-training","name":"Train Flux LoRA","created_by":"fal","source":"official","description":"Train styles, people and other subjects at blazing speeds.","status":"active","release_date":"2025-01-01","model_type":"other","page_url":"https://fal.run/fal-ai/flux-lora-fast-training","tagline":"Train styles, people and other subjects at blazing speeds.","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/flux-lora-fill","name":"FLUX.1 [dev] Fill with LoRAs","created_by":"fal","source":"official","description":"FLUX.1 [dev] Fill is a high-performance endpoint for the FLUX.1 [pro] model that enables rapid transformation of existing images, delivering high-quality style transfers and image modifications with t","status":"active","release_date":"2024-12-19","model_type":"image","page_url":"https://fal.run/fal-ai/flux-lora-fill","tagline":"FLUX.1 [dev] Fill is a high-performance endpoint for the FLUX.1 [pro] model that enables rapid transformation of existing images, delivering high-quality style transfers and image modifications with t","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/flux-lora/image-to-image","name":"FLUX.1 [dev] with LoRAs","created_by":"fal","source":"official","description":"FLUX LoRA Image-to-Image is a high-performance endpoint that transforms existing images using FLUX models, leveraging LoRA adaptations to enable rapid and precise image style transfer, modifications, 
","status":"active","release_date":"2024-08-13","model_type":"image","page_url":"https://fal.run/fal-ai/flux-lora/image-to-image","tagline":"FLUX LoRA Image-to-Image is a high-performance endpoint that transforms existing images using FLUX models, leveraging LoRA adaptations to enable rapid and precise image style transfer, modifications, ","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/flux-lora/inpainting","name":"FLUX.1 [dev] Inpainting with LoRAs","created_by":"fal","source":"official","description":"Super fast endpoint for the FLUX.1 [dev] inpainting model with LoRA support, enabling rapid and high-quality image inpaingting using pre-trained LoRA adaptations for personalization, specific styles, ","status":"active","release_date":"2024-09-18","model_type":"image","page_url":"https://fal.run/fal-ai/flux-lora/inpainting","tagline":"Super fast endpoint for the FLUX.1 [dev] inpainting model with LoRA support, enabling rapid and high-quality image inpaingting using pre-trained LoRA adaptations for personalization, specific styles, ","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/flux-lora-portrait-trainer","name":"Train Flux LoRAs For Portraits","created_by":"fal","source":"official","description":"FLUX LoRA training optimized for portrait generation, with bright highlights, excellent prompt following and highly detailed results.","status":"active","release_date":"2024-11-07","model_type":"other","page_url":"https://fal.run/fal-ai/flux-lora-portrait-trainer","tagline":"FLUX LoRA training optimized for portrait generation, with bright highlights, excellent prompt following and highly detailed results.","last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/flux-lora/stream","name":"Flux 
Lora","created_by":"fal","source":"official","description":"Super fast endpoint for the FLUX.1 [dev] model with LoRA support, enabling rapid and high-quality image generation using pre-trained LoRA adaptations for personalization, specific styles, brand identi","status":"active","release_date":"2025-05-15","model_type":"image","page_url":"https://fal.run/fal-ai/flux-lora/stream","tagline":"Super fast endpoint for the FLUX.1 [dev] model with LoRA support, enabling rapid and high-quality image generation using pre-trained LoRA adaptations for personalization, specific styles, brand identi","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/flux-lora","name":"FLUX.1 [dev] with LoRAs","created_by":"fal","source":"official","description":"Super fast endpoint for the FLUX.1 [dev] model with LoRA support, enabling rapid and high-quality image generation using pre-trained LoRA adaptations for personalization, specific styles, brand identi","status":"active","release_date":"2024-08-01","model_type":"image","page_url":"https://fal.run/fal-ai/flux-lora","tagline":"Super fast endpoint for the FLUX.1 [dev] model with LoRA support, enabling rapid and high-quality image generation using pre-trained LoRA adaptations for personalization, specific styles, brand identi","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/flux-pro/kontext/max/multi","name":"FLUX.1 Kontext [max]","created_by":"fal","source":"official","description":"Experimental version of FLUX.1 Kontext [max] with multi image handling capabilities","status":"active","release_date":"2025-05-29","model_type":"image","page_url":"https://fal.run/fal-ai/flux-pro/kontext/max/multi","tagline":"Experimental version of FLUX.1 Kontext [max] with multi image handling 
capabilities","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/flux-pro/kontext/max/text-to-image","name":"FLUX.1 Kontext [max]","created_by":"fal","source":"official","description":"FLUX.1 Kontext [max] text-to-image is a new premium model brings maximum performance across all aspects – greatly improved prompt adherence.","status":"active","release_date":"2025-05-29","model_type":"image","page_url":"https://fal.run/fal-ai/flux-pro/kontext/max/text-to-image","tagline":"FLUX.1 Kontext [max] text-to-image is a new premium model brings maximum performance across all aspects – greatly improved prompt adherence.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/flux-pro/kontext/max","name":"FLUX.1 Kontext [max]","created_by":"fal","source":"official","description":"FLUX.1 Kontext [max] is a model with greatly improved prompt adherence and typography generation meet premium consistency for editing without compromise on speed.","status":"active","release_date":"2025-05-29","model_type":"image","page_url":"https://fal.run/fal-ai/flux-pro/kontext/max","tagline":"FLUX.1 Kontext [max] is a model with greatly improved prompt adherence and typography generation meet premium consistency for editing without compromise on speed.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/flux-pro/kontext/multi","name":"FLUX.1 Kontext [pro]","created_by":"fal","source":"official","description":"Experimental version of FLUX.1 Kontext [pro] with multi image handling 
capabilities","status":"active","release_date":"2025-05-29","model_type":"image","page_url":"https://fal.run/fal-ai/flux-pro/kontext/multi","tagline":"Experimental version of FLUX.1 Kontext [pro] with multi image handling capabilities","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/flux-pro/kontext/text-to-image","name":"FLUX.1 Kontext [pro]","created_by":"fal","source":"official","description":"The FLUX.1 Kontext [pro] text-to-image delivers state-of-the-art image generation results with unprecedented prompt following, photorealistic rendering, and flawless typography.","status":"active","release_date":"2025-05-28","model_type":"image","page_url":"https://fal.run/fal-ai/flux-pro/kontext/text-to-image","tagline":"The FLUX.1 Kontext [pro] text-to-image delivers state-of-the-art image generation results with unprecedented prompt following, photorealistic rendering, and flawless typography.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/flux-pro/kontext","name":"FLUX.1 Kontext [pro]","created_by":"fal","source":"official","description":"FLUX.1 Kontext [pro] handles both text and reference images as inputs, seamlessly enabling targeted, local edits and complex transformations of entire scenes.","status":"active","release_date":"2025-05-28","model_type":"image","page_url":"https://fal.run/fal-ai/flux-pro/kontext","tagline":"FLUX.1 Kontext [pro] handles both text and reference images as inputs, seamlessly enabling targeted, local edits and complex transformations of entire scenes.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/flux-pro/v1/erase","name":"Flux Pro 
Erase","created_by":"fal","source":"official","description":"Latest object erasing model from Black Forest Labs.","status":"active","release_date":"2026-05-21","model_type":"image","page_url":"https://fal.run/fal-ai/flux-pro/v1/erase","tagline":"Latest object erasing model from Black forest labs.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-18","last_updated":"2026-06-20"},{"id":"fal-ai/flux-pro/v1/fill-finetuned","name":"FLUX.1 [pro] Fill Fine-tuned","created_by":"fal","source":"official","description":"FLUX.1 [pro] Fill Fine-tuned is a high-performance endpoint for the FLUX.1 [pro] model with a fine-tuned LoRA that enables rapid transformation of existing images, delivering high-quality style transf","status":"active","release_date":"2025-01-16","model_type":"image","page_url":"https://fal.run/fal-ai/flux-pro/v1/fill-finetuned","tagline":"FLUX.1 [pro] Fill Fine-tuned is a high-performance endpoint for the FLUX.1 [pro] model with a fine-tuned LoRA that enables rapid transformation of existing images, delivering high-quality style transf","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/flux-pro/v1/fill","name":"FLUX.1 [pro] Fill","created_by":"fal","source":"official","description":"FLUX.1 [pro] Fill is a high-performance endpoint for the FLUX.1 [pro] model that enables rapid transformation of existing images, delivering high-quality style transfers and image modifications with t","status":"active","release_date":"2024-11-21","model_type":"image","page_url":"https://fal.run/fal-ai/flux-pro/v1/fill","tagline":"FLUX.1 [pro] Fill is a high-performance endpoint for the FLUX.1 [pro] model that enables rapid transformation of existing images, delivering high-quality style transfers and image modifications with 
t","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/flux-pro/v1/vto","name":"FLUX Virtual Try-On ","created_by":"fal","source":"official","description":"Generate virtual try-on results from a person image plus one or more garment references.","status":"active","release_date":"2026-05-27","model_type":"image","page_url":"https://fal.run/fal-ai/flux-pro/v1/vto","tagline":"Generate virtual try-on results from a person image plus one or more garment references.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/flux-pro/v1.1/redux","name":"FLUX1.1 [pro] Redux","created_by":"fal","source":"official","description":"FLUX1.1 [pro] Redux is a high-performance endpoint for the FLUX1.1 [pro] model that enables rapid transformation of existing images, delivering high-quality style transfers and image modifications wit","status":"active","release_date":"2024-11-21","model_type":"image","page_url":"https://fal.run/fal-ai/flux-pro/v1.1/redux","tagline":"FLUX1.1 [pro] Redux is a high-performance endpoint for the FLUX1.1 [pro] model that enables rapid transformation of existing images, delivering high-quality style transfers and image modifications wit","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/flux-pro/v1.1-ultra-finetuned","name":"FLUX1.1 [pro] ultra Fine-tuned","created_by":"fal","source":"official","description":"FLUX1.1 [pro] ultra fine-tuned is the newest version of FLUX1.1 [pro] with a fine-tuned LoRA, maintaining professional-grade image quality while delivering up to 2K resolution with improved photo 
real","status":"active","release_date":"2025-01-16","model_type":"image","page_url":"https://fal.run/fal-ai/flux-pro/v1.1-ultra-finetuned","tagline":"FLUX1.1 [pro] ultra fine-tuned is the newest version of FLUX1.1 [pro] with a fine-tuned LoRA, maintaining professional-grade image quality while delivering up to 2K resolution with improved photo real","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/flux-pro/v1.1-ultra/redux","name":"FLUX1.1 [pro] ultra Redux","created_by":"fal","source":"official","description":"FLUX1.1 [pro] ultra Redux is a high-performance endpoint for the FLUX1.1 [pro] model that enables rapid transformation of existing images, delivering high-quality style transfers and image modificatio","status":"active","release_date":"2024-11-21","model_type":"image","page_url":"https://fal.run/fal-ai/flux-pro/v1.1-ultra/redux","tagline":"FLUX1.1 [pro] ultra Redux is a high-performance endpoint for the FLUX1.1 [pro] model that enables rapid transformation of existing images, delivering high-quality style transfers and image modificatio","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/flux-pro/v1.1-ultra","name":"FLUX1.1 [pro] ultra","created_by":"fal","source":"official","description":"FLUX1.1 [pro] ultra is the newest version of FLUX1.1 [pro], maintaining professional-grade image quality while delivering up to 2K resolution with improved photo realism.","status":"active","release_date":"2024-12-17","model_type":"image","page_url":"https://fal.run/fal-ai/flux-pro/v1.1-ultra","tagline":"FLUX1.1 [pro] ultra is the newest version of FLUX1.1 [pro], maintaining professional-grade image quality while delivering up to 2K resolution with improved photo 
realism.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/flux-pro/v1.1","name":"FLUX1.1 [pro]","created_by":"fal","source":"official","description":"FLUX1.1 [pro] is an enhanced version of FLUX.1 [pro], improved image generation capabilities, delivering superior composition, detail, and artistic fidelity compared to its predecessor.","status":"active","release_date":"2025-01-16","model_type":"image","page_url":"https://fal.run/fal-ai/flux-pro/v1.1","tagline":"FLUX1.1 [pro] is an enhanced version of FLUX.1 [pro], improved image generation capabilities, delivering superior composition, detail, and artistic fidelity compared to its predecessor.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/flux-pulid","name":"PuLID Flux","created_by":"fal","source":"official","description":"An endpoint for personalized image generation using Flux as per given description.","status":"active","release_date":"2024-10-29","model_type":"image","page_url":"https://fal.run/fal-ai/flux-pulid","tagline":"An endpoint for personalized image generation using Flux as per given description.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-03-10","last_updated":"2026-05-11"},{"id":"fal-ai/flux/schnell/redux","name":"FLUX.1 [schnell] Redux","created_by":"fal","source":"official","description":"FLUX.1 [schnell] Redux is a high-performance endpoint for the FLUX.1 [schnell] model that enables rapid transformation of existing images, delivering high-quality style transfers and image modificatio","status":"active","release_date":"2024-11-27","model_type":"image","page_url":"https://fal.run/fal-ai/flux/schnell/redux","tagline":"FLUX.1 [schnell] Redux is a 
high-performance endpoint for the FLUX.1 [schnell] model that enables rapid transformation of existing images, delivering high-quality style transfers and image modificatio","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/flux/schnell","name":"FLUX.1 [schnell]","created_by":"fal","source":"official","description":"FLUX.1 [schnell] is a 12 billion parameter flow transformer that generates high-quality images from text in 1 to 4 steps, suitable for personal and commercial use.","status":"active","release_date":"2024-11-25","model_type":"image","page_url":"https://fal.run/fal-ai/flux/schnell","tagline":"FLUX.1 [schnell] is a 12 billion parameter flow transformer that generates high-quality images from text in 1 to 4 steps, suitable for personal and commercial use.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/flux/srpo/image-to-image","name":"FLUX.1 SRPO [dev]","created_by":"fal","source":"official","description":"FLUX.1 SRPO [dev] is a 12 billion parameter flow transformer that generates high-quality images from text with incredible aesthetics.","status":"active","release_date":"2025-09-15","model_type":"image","page_url":"https://fal.run/fal-ai/flux/srpo/image-to-image","tagline":"FLUX.1 SRPO [dev] is a 12 billion parameter flow transformer that generates high-quality images from text with incredible aesthetics.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/flux/srpo","name":"FLUX.1 SRPO [dev]","created_by":"fal","source":"official","description":"FLUX.1 SRPO [dev] is a 12 billion parameter flow transformer that generates high-quality images from text with incredible 
aesthetics.","status":"active","release_date":"2025-09-15","model_type":"image","page_url":"https://fal.run/fal-ai/flux/srpo","tagline":"FLUX.1 SRPO [dev] is a 12 billion parameter flow transformer that generates high-quality images from text with incredible aesthetics.","capabilities":{"streaming":true,"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/flux-subject","name":"FLUX.1 Subject","created_by":"fal","source":"official","description":"Super fast endpoint for the FLUX.1 [schnell] model with subject input capabilities, enabling rapid and high-quality image generation for personalization, specific styles, brand identities, and product","status":"active","release_date":"2024-08-01","model_type":"image","page_url":"https://fal.run/fal-ai/flux-subject","tagline":"Super fast endpoint for the FLUX.1 [schnell] model with subject input capabilities, enabling rapid and high-quality image generation for personalization, specific styles, brand identities, and product","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/flux-vision-upscaler","name":"Flux Vision Upscaler","created_by":"fal","source":"official","description":"Flux Vision Upscaler for magnify/upscaling images with high fidelity and creativity.","status":"active","release_date":"2025-11-02","model_type":"image","page_url":"https://fal.run/fal-ai/flux-vision-upscaler","tagline":"Flux Vision Upscaler for magnify/upscaling images with high fidelity and creativity.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/fooocus/image-prompt","name":"Fooocus Image Prompt","created_by":"fal","source":"official","description":"Default parameters with 
automated optimizations and quality improvements.","status":"active","release_date":"2024-02-13","model_type":"image","page_url":"https://fal.run/fal-ai/fooocus/image-prompt","tagline":"Default parameters with automated optimizations and quality improvements.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/fooocus/inpaint","name":"Fooocus Inpainting","created_by":"fal","source":"official","description":"Default parameters with automated optimizations and quality improvements.","status":"active","release_date":"2024-02-13","model_type":"image","page_url":"https://fal.run/fal-ai/fooocus/inpaint","tagline":"Default parameters with automated optimizations and quality improvements.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/fooocus/upscale-or-vary","name":"Fooocus Upscale or Vary","created_by":"fal","source":"official","description":"Default parameters with automated optimizations and quality improvements.","status":"active","release_date":"2024-08-12","model_type":"image","page_url":"https://fal.run/fal-ai/fooocus/upscale-or-vary","tagline":"Default parameters with automated optimizations and quality improvements.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/fooocus","name":"Fooocus","created_by":"fal","source":"official","description":"Default parameters with automated optimizations and quality improvements.","status":"active","release_date":"2023-11-16","model_type":"image","page_url":"https://fal.run/fal-ai/fooocus","tagline":"Default parameters with automated optimizations and quality 
improvements.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/framepack/f1","name":"Framepack F1","created_by":"fal","source":"official","description":"Framepack is an efficient Image-to-video model that autoregressively generates videos.","status":"active","release_date":"2025-05-13","model_type":"video","page_url":"https://fal.run/fal-ai/framepack/f1","tagline":"Framepack is an efficient Image-to-video model that autoregressively generates videos.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/framepack/flf2v","name":"Framepack","created_by":"fal","source":"official","description":"Framepack is an efficient Image-to-video model that autoregressively generates videos.","status":"active","release_date":"2025-04-22","model_type":"video","page_url":"https://fal.run/fal-ai/framepack/flf2v","tagline":"Framepack is an efficient Image-to-video model that autoregressively generates videos.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/framepack","name":"Framepack","created_by":"fal","source":"official","description":"Framepack is an efficient Image-to-video model that autoregressively generates videos.","status":"active","release_date":"2025-04-17","model_type":"video","page_url":"https://fal.run/fal-ai/framepack","tagline":"Framepack is an efficient Image-to-video model that autoregressively generates videos.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/gemini-25-flash-image/edit","name":"Gemini 2.5 Flash 
Image","created_by":"fal","source":"official","family":"gemini-25","description":"Google's famous original image generation and editing model, a.k.a Nano Banana","status":"active","release_date":"2025-08-26","model_type":"image","page_url":"https://fal.run/fal-ai/gemini-25-flash-image/edit","tagline":"Google's famous original image generation and editing model, a.k.a Nano Banana","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/gemini-25-flash-image","name":"Gemini 2.5 Flash Image","created_by":"fal","source":"official","family":"gemini-25","description":"Google's famous original image generation and editing model, a.k.a Nano Banana","status":"active","release_date":"2025-08-26","model_type":"image","page_url":"https://fal.run/fal-ai/gemini-25-flash-image","tagline":"Google's famous original image generation and editing model, a.k.a Nano Banana","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/gemini-3-pro-image-preview/edit","name":"Gemini 3 Pro Image Preview","created_by":"fal","source":"official","family":"gemini-3","description":"Gemini 3 Pro Image (a.k.a Nano Banana Pro) is Google's state-of-the-art high-fidelity image generation and editing model","status":"active","release_date":"2025-11-20","model_type":"image","page_url":"https://fal.run/fal-ai/gemini-3-pro-image-preview/edit","tagline":"Gemini 3 Pro Image (a.k.a Nano Banana Pro) is Google's state-of-the-art high-fidelity image generation and editing model","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-28","last_updated":"2026-05-11"},{"id":"fal-ai/gemini-3-pro-image-preview","name":"Gemini 3 Pro Image 
Preview","created_by":"fal","source":"official","family":"gemini-3","description":"Gemini 3 Pro Image (a.k.a Nano Banana Pro) is Google's state-of-the-art high-fidelity image generation and editing model","status":"active","release_date":"2025-11-20","model_type":"image","page_url":"https://fal.run/fal-ai/gemini-3-pro-image-preview","tagline":"Gemini 3 Pro Image (a.k.a Nano Banana Pro) is Google's state-of-the-art high-fidelity image generation and editing model","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-28","last_updated":"2026-05-11"},{"id":"fal-ai/gemini-3.1-flash-image-preview/edit","name":"Gemini 3.1 Flash Image Preview","created_by":"fal","source":"official","family":"gemini-3.1","description":"Gemini 3.1 Flash Image (a.k.a.","status":"active","release_date":"2026-02-26","model_type":"image","page_url":"https://fal.run/fal-ai/gemini-3.1-flash-image-preview/edit","tagline":"Gemini 3.1 Flash Image (a.k.a.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-28","last_updated":"2026-05-11"},{"id":"fal-ai/gemini-3.1-flash-image-preview","name":"Gemini 3.1 Flash Image Preview","created_by":"fal","source":"official","family":"gemini-3.1","description":"Gemini 3.1 Flash Image (a.k.a Nano Banana 2) is Google's new state-of-the-art fast image generation and editing model","status":"active","release_date":"2026-02-26","model_type":"image","page_url":"https://fal.run/fal-ai/gemini-3.1-flash-image-preview","tagline":"Gemini 3.1 Flash Image (a.k.a Nano Banana 2) is Google's new state-of-the-art fast image generation and editing model","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-05-07","last_updated":"2026-05-11"},{"id":"fal-ai/gemini-3.1-flash-tts","name":"Gemini 3.1 Flash 
Tts","created_by":"fal","source":"official","family":"gemini-3.1","description":"Newest audio model from Google introduces granular audio tags that give you precise control to direct AI speech for expressive audio generation.","status":"active","release_date":"2026-04-16","model_type":"tts","page_url":"https://fal.run/fal-ai/gemini-3.1-flash-tts","tagline":"Newest audio model from Google introduces granular audio tags that give you precise control to direct AI speech for expressive audio generation.","modalities":{"input":["text"],"output":["audio"]},"endpoints":["audio_speech"],"last_seen_at":"2026-04-28","last_updated":"2026-05-11"},{"id":"fal-ai/gemini-tts","name":"Gemini TTS","created_by":"fal","source":"official","description":"Use Gemini TTS Models to convert your prompts to real audio.","status":"active","release_date":"2026-03-20","model_type":"other","page_url":"https://fal.run/fal-ai/gemini-tts","tagline":"Use Gemini TTS Models to convert your prompts to real audio.","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/genfocus/all-in-focus","name":"Genfocus","created_by":"fal","source":"official","description":"GenFocus Model to Refocus Images","status":"active","release_date":"2026-02-14","model_type":"image","page_url":"https://fal.run/fal-ai/genfocus/all-in-focus","tagline":"GenFocus Model to Refocus Images","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-02-14","last_updated":"2026-05-11"},{"id":"fal-ai/genfocus","name":"Genfocus","created_by":"fal","source":"official","description":"GenFocus Model to Refocus Images","status":"active","release_date":"2026-02-14","model_type":"image","page_url":"https://fal.run/fal-ai/genfocus","tagline":"GenFocus Model to Refocus 
Images","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-02-14","last_updated":"2026-05-11"},{"id":"fal-ai/ghiblify","name":"Ghiblify Images","created_by":"fal","source":"official","description":"Reimagine and transform your ordinary photos into enchanting Studio Ghibli style artwork","status":"active","release_date":"2025-03-31","model_type":"image","page_url":"https://fal.run/fal-ai/ghiblify","tagline":"Reimagine and transform your ordinary photos into enchanting Studio Ghibli style artwork","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/glm-image/image-to-image","name":"Glm Image","created_by":"fal","source":"official","family":"glm","description":"Create high-quality images with accurate text rendering and rich knowledge details—supports editing, style transfer, and maintaining consistent characters across multiple images.","status":"active","release_date":"2026-01-14","model_type":"image","page_url":"https://fal.run/fal-ai/glm-image/image-to-image","tagline":"Create high-quality images with accurate text rendering and rich knowledge details—supports editing, style transfer, and maintaining consistent characters across multiple images.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/glm-image","name":"Glm Image","created_by":"fal","source":"official","family":"glm","description":"Create high-quality images with accurate text rendering and rich knowledge details—supports editing, style transfer, and maintaining consistent characters across multiple images.","status":"active","release_date":"2026-01-14","model_type":"image","page_url":"https://fal.run/fal-ai/glm-image","tagline":"Create high-quality images with 
accurate text rendering and rich knowledge details—supports editing, style transfer, and maintaining consistent characters across multiple images.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/goal-force","name":"Goal Force","created_by":"fal","source":"official","description":"Physics-based video generation with Goal Force.","status":"active","release_date":"2026-03-17","model_type":"video","page_url":"https://fal.run/fal-ai/goal-force","tagline":"Physics-based video generation with Goal Force.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-03-17","last_updated":"2026-05-11"},{"id":"fal-ai/got-ocr/v2","name":"GOT OCR 2.0","created_by":"fal","source":"official","description":"GOT-OCR2 works on a wide range of tasks, including plain document OCR, scene text OCR, formatted document OCR, and even OCR for tables, charts, mathematical formulas, geometric shapes, molecular formu","status":"active","release_date":"2025-02-12","model_type":"other","page_url":"https://fal.run/fal-ai/got-ocr/v2","tagline":"GOT-OCR2 works on a wide range of tasks, including plain document OCR, scene text OCR, formatted document OCR, and even OCR for tables, charts, mathematical formulas, geometric shapes, molecular formu","capabilities":{"vision":true},"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/gpt-image-1/edit-image","name":"gpt-image-1","created_by":"fal","source":"official","family":"gpt-image-1","description":"OpenAI's latest image generation and editing model: gpt-1-image.","status":"active","release_date":"2025-04-23","model_type":"image","page_url":"https://fal.run/fal-ai/gpt-image-1/edit-image","tagline":"OpenAI's latest image generation and editing model: 
gpt-1-image.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/gpt-image-1-mini/edit","name":"GPT Image 1 Mini","created_by":"fal","source":"official","family":"gpt-image-1","description":"GPT Image 1 mini combines OpenAI's advanced language capabilities, powered by GPT-5, with GPT Image 1 Mini for efficient image generation.","status":"active","release_date":"2025-10-21","model_type":"image","page_url":"https://fal.run/fal-ai/gpt-image-1-mini/edit","tagline":"GPT Image 1 mini combines OpenAI's advanced language capabilities, powered by GPT-5, with GPT Image 1 Mini for efficient image generation.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/gpt-image-1-mini","name":"GPT Image 1 Mini","created_by":"fal","source":"official","family":"gpt-image-1","description":"GPT Image 1 mini combines OpenAI's advanced language capabilities, powered by GPT-5, with GPT Image 1 Mini for efficient image generation.","status":"active","release_date":"2025-10-21","model_type":"image","page_url":"https://fal.run/fal-ai/gpt-image-1-mini","tagline":"GPT Image 1 mini combines OpenAI's advanced language capabilities, powered by GPT-5, with GPT Image 1 Mini for efficient image generation.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/gpt-image-1/text-to-image","name":"gpt-image-1","created_by":"fal","source":"official","family":"gpt-image-1","description":"OpenAI's latest image generation and editing model: gpt-1-image.","status":"active","release_date":"2025-04-23","model_type":"image","page_url":"https://fal.run/fal-ai/gpt-image-1/text-to-image","tagline":"OpenAI's latest image generation and 
editing model: gpt-1-image.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/gpt-image-1.5/edit","name":"GPT-Image 1.5","created_by":"fal","source":"official","family":"gpt-image-1.5","description":"GPT Image 1.5 generates high-fidelity images with strong prompt adherence, preserving composition, lighting, and fine-grained detail.","status":"active","release_date":"2025-12-16","model_type":"image","page_url":"https://fal.run/fal-ai/gpt-image-1.5/edit","tagline":"GPT Image 1.5 generates high-fidelity images with strong prompt adherence, preserving composition, lighting, and fine-grained detail.","capabilities":{"streaming":true,"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/gpt-image-1.5","name":"GPT-Image 1.5","created_by":"fal","source":"official","family":"gpt-image-1.5","description":"GPT Image 1.5 generates high-fidelity images with strong prompt adherence, preserving composition, lighting, and fine-grained detail.","status":"active","release_date":"2025-12-16","model_type":"image","page_url":"https://fal.run/fal-ai/gpt-image-1.5","tagline":"GPT Image 1.5 generates high-fidelity images with strong prompt adherence, preserving composition, lighting, and fine-grained detail.","capabilities":{"streaming":true,"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/heygen/avatar3/digital-twin","name":"Heygen","created_by":"fal","source":"official","description":"Heygen Avatar V3 Model for Digital Twin","status":"active","release_date":"2026-02-23","model_type":"video","page_url":"https://fal.run/fal-ai/heygen/avatar3/digital-twin","tagline":"Heygen Avatar V3 Model for Digital 
Twin","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/heygen/avatar4/digital-twin","name":"Heygen","created_by":"fal","source":"official","description":"Heygen Avatar 4 Digital Twin Model","status":"active","release_date":"2026-02-23","model_type":"video","page_url":"https://fal.run/fal-ai/heygen/avatar4/digital-twin","tagline":"Heygen Avatar 4 Digital Twin Model","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/heygen/avatar4/image-to-video","name":"Heygen","created_by":"fal","source":"official","description":"Heygen Photo Avatar 4 Model","status":"active","release_date":"2026-02-23","model_type":"video","page_url":"https://fal.run/fal-ai/heygen/avatar4/image-to-video","tagline":"Heygen Photo Avatar 4 Model","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/heygen/avatar5/digital-twin","name":"Heygen v5 Digital Twin","created_by":"fal","source":"official","description":"Create natural HeyGen Avatar V digital twin videos from text or audio, with lip-sync, optional backgrounds, captions, and MP4/WebM output.","status":"active","release_date":"2026-05-17","model_type":"video","page_url":"https://fal.run/fal-ai/heygen/avatar5/digital-twin","tagline":"Create natural HeyGen Avatar V digital twin videos from text or audio, with lip-sync, optional backgrounds, captions, and MP4/WebM output.","modalities":{"input":["text","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-05-20","last_updated":"2026-06-03"},{"id":"fal-ai/heygen/v2/translate/precision","name":"Heygen","created_by":"fal","source":"official","description":"Heygen Translate Model with Extreme 
Precision","status":"active","release_date":"2026-02-23","model_type":"other","page_url":"https://fal.run/fal-ai/heygen/v2/translate/precision","tagline":"Heygen Translate Model with Extreme Precision","last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/heygen/v2/translate/speed","name":"Heygen","created_by":"fal","source":"official","description":"Heygen Translate Model with Extreme Speed","status":"active","release_date":"2026-02-23","model_type":"other","page_url":"https://fal.run/fal-ai/heygen/v2/translate/speed","tagline":"Heygen Translate Model with Extreme Speed","last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/heygen/v2/video-agent","name":"Heygen","created_by":"fal","source":"official","description":"Heygen Text to Video Generation Model","status":"active","release_date":"2026-02-15","model_type":"video","page_url":"https://fal.run/fal-ai/heygen/v2/video-agent","tagline":"Heygen Text to Video Generation Model","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/heygen/v3/lipsync/precision","name":"Heygen Lipsync - Precision","created_by":"fal","source":"official","description":"Replace or dub audio on an existing video with high-accuracy avatar-inference lip-sync.","status":"active","release_date":"2026-04-14","model_type":"other","page_url":"https://fal.run/fal-ai/heygen/v3/lipsync/precision","tagline":"Replace or dub audio on an existing video with high-accuracy avatar-inference lip-sync.","last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/heygen/v3/lipsync/speed","name":"Heygen Lipsync - Speed","created_by":"fal","source":"official","description":"Replace or dub audio on an existing video with fast audio-only lip-sync.","status":"active","release_date":"2026-04-14","model_type":"other","page_url":"https://fal.run/fal-ai/heygen/v3/lipsync/speed","tagline":"Replace or dub audio on an existing video with 
fast audio-only lip-sync.","last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/heygen/v3/video-agent","name":"Heygen Video Agent","created_by":"fal","source":"official","description":"Generate videos with a single prompt.","status":"active","release_date":"2026-04-16","model_type":"video","page_url":"https://fal.run/fal-ai/heygen/v3/video-agent","tagline":"Generate videos with a single prompt.","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/hidream-e1-1","name":"Hidream E1 1","created_by":"fal","source":"official","description":"Edit images with natural language","status":"active","release_date":"2025-07-23","model_type":"image","page_url":"https://fal.run/fal-ai/hidream-e1-1","tagline":"Edit images with natural language","capabilities":{"streaming":true,"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/hidream-i1-dev","name":"Hidream I1 Dev","created_by":"fal","source":"official","description":"HiDream-I1 dev is a new open-source image generative foundation model with 17B parameters that achieves state-of-the-art image generation quality within seconds.","status":"active","release_date":"2025-04-11","model_type":"image","page_url":"https://fal.run/fal-ai/hidream-i1-dev","tagline":"HiDream-I1 dev is a new open-source image generative foundation model with 17B parameters that achieves state-of-the-art image generation quality within seconds.","capabilities":{"streaming":true,"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/hidream-i1-fast","name":"Hidream I1 Fast","created_by":"fal","source":"official","description":"HiDream-I1 fast is a new open-source image generative foundation model with 17B parameters that achieves 
state-of-the-art image generation quality within 16 steps.","status":"active","release_date":"2025-04-11","model_type":"image","page_url":"https://fal.run/fal-ai/hidream-i1-fast","tagline":"HiDream-I1 fast is a new open-source image generative foundation model with 17B parameters that achieves state-of-the-art image generation quality within 16 steps.","capabilities":{"streaming":true,"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/hidream-i1-full/image-to-image","name":"Hidream I1 Full","created_by":"fal","source":"official","description":"HiDream-I1 full is a new open-source image generative foundation model with 17B parameters that achieves state-of-the-art image generation quality within seconds.","status":"active","release_date":"2025-05-05","model_type":"image","page_url":"https://fal.run/fal-ai/hidream-i1-full/image-to-image","tagline":"HiDream-I1 full is a new open-source image generative foundation model with 17B parameters that achieves state-of-the-art image generation quality within seconds.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/hidream-i1-full","name":"Hidream I1 Full","created_by":"fal","source":"official","description":"HiDream-I1 full is a new open-source image generative foundation model with 17B parameters that achieves state-of-the-art image generation quality within seconds.","status":"active","release_date":"2025-04-11","model_type":"image","page_url":"https://fal.run/fal-ai/hidream-i1-full","tagline":"HiDream-I1 full is a new open-source image generative foundation model with 17B parameters that achieves state-of-the-art image generation quality within 
seconds.","capabilities":{"streaming":true,"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/hidream-o1-image/dev/edit","name":"Hidream O1 Image","created_by":"fal","source":"official","description":"Unified image generation with HiDream-O1-Image.","status":"active","release_date":"2026-05-09","model_type":"image","page_url":"https://fal.run/fal-ai/hidream-o1-image/dev/edit","tagline":"Unified image generation with HiDream-O1-Image.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-05-10","last_updated":"2026-05-11"},{"id":"fal-ai/hidream-o1-image/dev","name":"Hidream O1 Image","created_by":"fal","source":"official","description":"Unified image generation with HiDream-O1-Image.","status":"active","release_date":"2026-05-09","model_type":"image","page_url":"https://fal.run/fal-ai/hidream-o1-image/dev","tagline":"Unified image generation with HiDream-O1-Image.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-05-10","last_updated":"2026-05-11"},{"id":"fal-ai/hidream-o1-image/edit","name":"Hidream O1 Image","created_by":"fal","source":"official","description":"Unified image generation with HiDream-O1-Image.","status":"active","release_date":"2026-05-09","model_type":"image","page_url":"https://fal.run/fal-ai/hidream-o1-image/edit","tagline":"Unified image generation with HiDream-O1-Image.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-05-10","last_updated":"2026-05-11"},{"id":"fal-ai/hidream-o1-image","name":"Hidream O1 Image","created_by":"fal","source":"official","description":"Unified image generation with 
HiDream-O1-Image.","status":"active","release_date":"2026-05-09","model_type":"image","page_url":"https://fal.run/fal-ai/hidream-o1-image","tagline":"Unified image generation with HiDream-O1-Image.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-05-10","last_updated":"2026-05-11"},{"id":"fal-ai/hunyuan-3d/v3.1/part","name":"Hunyuan 3D Part Splitter","created_by":"fal","source":"official","description":"Split 3D models into parts with Hunyuan 3D","status":"active","release_date":"2026-01-27","model_type":"other","page_url":"https://fal.run/fal-ai/hunyuan-3d/v3.1/part","tagline":"Split 3D models into parts with Hunyuan 3D","last_seen_at":"2026-04-28","last_updated":"2026-05-11"},{"id":"fal-ai/hunyuan-3d/v3.1/pro/image-to-3d","name":"Hunyuan 3D Pro Image to 3D","created_by":"fal","source":"official","description":"Generate 3D models from images with Hunyuan 3D Pro","status":"active","release_date":"2026-01-27","model_type":"other","page_url":"https://fal.run/fal-ai/hunyuan-3d/v3.1/pro/image-to-3d","tagline":"Generate 3D models from images with Hunyuan 3D Pro","capabilities":{"vision":true},"last_seen_at":"2026-04-28","last_updated":"2026-05-11"},{"id":"fal-ai/hunyuan-3d/v3.1/pro/text-to-3d","name":"Hunyuan 3D Pro Text to 3D","created_by":"fal","source":"official","description":"Generate 3D models from text prompts with Hunyuan 3D Pro","status":"active","release_date":"2026-01-27","model_type":"other","page_url":"https://fal.run/fal-ai/hunyuan-3d/v3.1/pro/text-to-3d","tagline":"Generate 3D models from text prompts with Hunyuan 3D Pro","last_seen_at":"2026-04-28","last_updated":"2026-05-11"},{"id":"fal-ai/hunyuan-3d/v3.1/rapid/image-to-3d","name":"Hunyuan 3D Rapid Image to 3D","created_by":"fal","source":"official","description":"Rapidly generate 3D models from images using Hunyuan 
3D.","status":"active","release_date":"2026-01-27","model_type":"other","page_url":"https://fal.run/fal-ai/hunyuan-3d/v3.1/rapid/image-to-3d","tagline":"Rapidly generate 3D models from images using Hunyuan 3D.","capabilities":{"vision":true},"last_seen_at":"2026-04-28","last_updated":"2026-05-11"},{"id":"fal-ai/hunyuan-3d/v3.1/rapid/text-to-3d","name":"Hunyuan 3d","created_by":"fal","source":"official","description":"Create detailed, fully-textured 3D models with text","status":"active","release_date":"2026-01-29","model_type":"other","page_url":"https://fal.run/fal-ai/hunyuan-3d/v3.1/rapid/text-to-3d","tagline":"Create detailed, fully-textured 3D models with text","last_seen_at":"2026-04-28","last_updated":"2026-05-11"},{"id":"fal-ai/hunyuan-3d/v3.1/smart-topology","name":"Hunyuan 3D Smart Topology","created_by":"fal","source":"official","description":"Optimize 3D mesh topology with Hunyuan 3D Smart Topology.","status":"active","release_date":"2026-01-27","model_type":"other","page_url":"https://fal.run/fal-ai/hunyuan-3d/v3.1/smart-topology","tagline":"Optimize 3D mesh topology with Hunyuan 3D Smart Topology.","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/hunyuan-avatar","name":"Hunyuan Avatar","created_by":"fal","source":"official","description":"HunyuanAvatar is a High-Fidelity Audio-Driven Human Animation model for Multiple Characters .","status":"active","release_date":"2025-05-29","model_type":"video","page_url":"https://fal.run/fal-ai/hunyuan-avatar","tagline":"HunyuanAvatar is a High-Fidelity Audio-Driven Human Animation model for Multiple Characters .","capabilities":{"vision":true},"modalities":{"input":["text","image","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/hunyuan-custom","name":"Hunyuan Custom","created_by":"fal","source":"official","description":"HunyuanCustom revolutionizes video generation with unmatched identity consistency across multiple 
input types.","status":"active","release_date":"2025-05-14","model_type":"video","page_url":"https://fal.run/fal-ai/hunyuan-custom","tagline":"HunyuanCustom revolutionizes video generation with unmatched identity consistency across multiple input types.","capabilities":{"vision":true},"modalities":{"input":["text","image","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/hunyuan-image/v2.1/text-to-image","name":"Hunyuan Image","created_by":"fal","source":"official","description":"Use the amazing capabilities of hunyuan image 2.1 to generate images that express the feelings of your text.","status":"active","release_date":"2025-09-09","model_type":"image","page_url":"https://fal.run/fal-ai/hunyuan-image/v2.1/text-to-image","tagline":"Use the amazing capabilities of hunyuan image 2.1 to generate images that express the feelings of your text.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/hunyuan-image/v3/instruct/edit","name":"Hunyuan Image","created_by":"fal","source":"official","description":"Image editing endpoint for Hunyuan Image 3.0 Instruct.","status":"active","release_date":"2026-01-28","model_type":"image","page_url":"https://fal.run/fal-ai/hunyuan-image/v3/instruct/edit","tagline":"Image editing endpoint for Hunyuan Image 3.0 Instruct.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-28","last_updated":"2026-05-11"},{"id":"fal-ai/hunyuan-image/v3/instruct/text-to-image","name":"Hunyuan Image 3.0 Instruct","created_by":"fal","source":"official","description":"Instruct version of Hunyuan-Image 3.0, with internal reasoning 
capabilities.","status":"active","release_date":"2026-01-28","model_type":"image","page_url":"https://fal.run/fal-ai/hunyuan-image/v3/instruct/text-to-image","tagline":"Instruct version of Hunyuan-Image 3.0, with internal reasoning capabilities.","capabilities":{"vision":true,"reasoning":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-05-14","last_updated":"2026-06-03"},{"id":"fal-ai/hunyuan-image/v3/text-to-image","name":"Hunyuan Image","created_by":"fal","source":"official","description":"Leverage the state-of-the-art capabilities of Hunyuan Image 3.0 to generate visual content that effectively conveys the messaging of your written material.","status":"active","release_date":"2025-09-28","model_type":"image","page_url":"https://fal.run/fal-ai/hunyuan-image/v3/text-to-image","tagline":"Leverage the state-of-the-art capabilities of Hunyuan Image 3.0 to generate visual content that effectively conveys the messaging of your written material.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/hunyuan-motion/fast","name":"Hunyuan Motion [0.46B]","created_by":"fal","source":"official","description":"Generate 3D human motions via text-to-generation interface of Hunyuan Motion!","status":"active","release_date":"2025-12-30","model_type":"other","page_url":"https://fal.run/fal-ai/hunyuan-motion/fast","tagline":"Generate 3D human motions via text-to-generation interface of Hunyuan Motion!","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/hunyuan-motion","name":"Hunyuan Motion [1B]","created_by":"fal","source":"official","description":"Generate 3D human motions via text-to-generation interface of Hunyuan Motion!","status":"active","release_date":"2025-12-30","model_type":"other","page_url":"https://fal.run/fal-ai/hunyuan-motion","tagline":"Generate 3D human motions via 
text-to-generation interface of Hunyuan Motion!","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/hunyuan-part","name":"Hunyuan Part","created_by":"fal","source":"official","description":"Use the capabilities of hunyuan part to generate point clouds from your 3D files.","status":"active","release_date":"2025-10-08","model_type":"other","page_url":"https://fal.run/fal-ai/hunyuan-part","tagline":"Use the capabilities of hunyuan part to generate point clouds from your 3D files.","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/hunyuan-portrait","name":"Hunyuan Portrait","created_by":"fal","source":"official","description":"HunyuanPortrait is a diffusion-based framework for generating lifelike, temporally consistent portrait animations.","status":"active","release_date":"2025-05-27","model_type":"video","page_url":"https://fal.run/fal-ai/hunyuan-portrait","tagline":"HunyuanPortrait is a diffusion-based framework for generating lifelike, temporally consistent portrait animations.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/hunyuan-video-foley","name":"Hunyuan Video Foley","created_by":"fal","source":"official","description":"Use the capabilities of the hunyuan foley model to bring life to your videos by adding sound effect to them.","status":"active","release_date":"2025-09-08","model_type":"other","page_url":"https://fal.run/fal-ai/hunyuan-video-foley","tagline":"Use the capabilities of the hunyuan foley model to bring life to your videos by adding sound effect to them.","last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/hunyuan-video-image-to-video","name":"Hunyuan Video Image-to-Video Inference","created_by":"fal","source":"official","description":"Image to Video for the high-quality Hunyuan Video I2V 
model.","status":"active","release_date":"2025-03-06","model_type":"video","page_url":"https://fal.run/fal-ai/hunyuan-video-image-to-video","tagline":"Image to Video for the high-quality Hunyuan Video I2V model.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/hunyuan-video-img2vid-lora","name":"Hunyuan Video Image-to-Video LoRA Inference","created_by":"fal","source":"official","description":"Image to Video for the Hunyuan Video model using a custom trained LoRA.","status":"active","release_date":"2025-02-03","model_type":"video","page_url":"https://fal.run/fal-ai/hunyuan-video-img2vid-lora","tagline":"Image to Video for the Hunyuan Video model using a custom trained LoRA.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/hunyuan-video-lora-training","name":"Train Hunyuan LoRA","created_by":"fal","source":"official","description":"Train Hunyuan Video lora on people, objects, characters and more!","status":"active","release_date":"2025-01-14","model_type":"other","page_url":"https://fal.run/fal-ai/hunyuan-video-lora-training","tagline":"Train Hunyuan Video lora on people, objects, characters and more!","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/hunyuan-video-lora/video-to-video","name":"Hunyuan Video LoRA Inference (Video-to-Video)","created_by":"fal","source":"official","description":"Hunyuan Video is an Open video generation model with high visual quality, motion diversity, text-video alignment, and generation stability.","status":"active","release_date":"2025-01-30","model_type":"other","page_url":"https://fal.run/fal-ai/hunyuan-video-lora/video-to-video","tagline":"Hunyuan Video is an Open video generation model with high visual quality, motion diversity, text-video 
alignment, and generation stability.","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/hunyuan-video-lora","name":"Hunyuan Video LoRA Inference","created_by":"fal","source":"official","description":"Hunyuan Video is an Open video generation model with high visual quality, motion diversity, text-video alignment, and generation stability","status":"active","release_date":"2025-01-16","model_type":"video","page_url":"https://fal.run/fal-ai/hunyuan-video-lora","tagline":"Hunyuan Video is an Open video generation model with high visual quality, motion diversity, text-video alignment, and generation stability","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/hunyuan-video-v1.5/image-to-video","name":"Hunyuan Video V1.5","created_by":"fal","source":"official","description":"Hunyuan Video 1.5 is Tencent's latest and best video model","status":"active","release_date":"2025-12-17","model_type":"video","page_url":"https://fal.run/fal-ai/hunyuan-video-v1.5/image-to-video","tagline":"Hunyuan Video 1.5 is Tencent's latest and best video model","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/hunyuan-video-v1.5/text-to-video","name":"Hunyuan Video V1.5","created_by":"fal","source":"official","description":"Hunyuan Video 1.5 is Tencent's latest and best video model","status":"active","release_date":"2025-11-21","model_type":"video","page_url":"https://fal.run/fal-ai/hunyuan-video-v1.5/text-to-video","tagline":"Hunyuan Video 1.5 is Tencent's latest and best video model","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/hunyuan-video/video-to-video","name":"Hunyuan Video 
(Video-to-Video)","created_by":"fal","source":"official","description":"Hunyuan Video is an Open video generation model with high visual quality, motion diversity, text-video alignment, and generation stability.","status":"active","release_date":"2025-01-30","model_type":"other","page_url":"https://fal.run/fal-ai/hunyuan-video/video-to-video","tagline":"Hunyuan Video is an Open video generation model with high visual quality, motion diversity, text-video alignment, and generation stability.","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/hunyuan-video","name":"Hunyuan Video","created_by":"fal","source":"official","description":"Hunyuan Video is an Open video generation model with high visual quality, motion diversity, text-video alignment, and generation stability.","status":"active","release_date":"2024-10-22","model_type":"video","page_url":"https://fal.run/fal-ai/hunyuan-video","tagline":"Hunyuan Video is an Open video generation model with high visual quality, motion diversity, text-video alignment, and generation stability.","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/hunyuan3d/v2/mini/turbo","name":"Hunyuan3D","created_by":"fal","source":"official","description":"Generate 3D models from your images using Hunyuan 3D.","status":"active","release_date":"2025-03-20","model_type":"other","page_url":"https://fal.run/fal-ai/hunyuan3d/v2/mini/turbo","tagline":"Generate 3D models from your images using Hunyuan 3D.","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/hunyuan3d/v2/mini","name":"Hunyuan3D","created_by":"fal","source":"official","description":"Generate 3D models from your images using Hunyuan 3D.","status":"active","release_date":"2025-03-20","model_type":"other","page_url":"https://fal.run/fal-ai/hunyuan3d/v2/mini","tagline":"Generate 3D models from your images using Hunyuan 
3D.","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/hunyuan3d/v2/multi-view/turbo","name":"Hunyuan3D","created_by":"fal","source":"official","description":"Generate 3D models from your images using Hunyuan 3D.","status":"active","release_date":"2025-03-20","model_type":"other","page_url":"https://fal.run/fal-ai/hunyuan3d/v2/multi-view/turbo","tagline":"Generate 3D models from your images using Hunyuan 3D.","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/hunyuan3d/v2/multi-view","name":"Hunyuan3D","created_by":"fal","source":"official","description":"Generate 3D models from your images using Hunyuan 3D.","status":"active","release_date":"2025-03-20","model_type":"other","page_url":"https://fal.run/fal-ai/hunyuan3d/v2/multi-view","tagline":"Generate 3D models from your images using Hunyuan 3D.","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/hunyuan3d/v2/turbo","name":"Hunyuan3D","created_by":"fal","source":"official","description":"Generate 3D models from your images using Hunyuan 3D.","status":"active","release_date":"2025-03-20","model_type":"other","page_url":"https://fal.run/fal-ai/hunyuan3d/v2/turbo","tagline":"Generate 3D models from your images using Hunyuan 3D.","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/hunyuan3d/v2","name":"Hunyuan3D","created_by":"fal","source":"official","description":"Generate 3D models from your images using Hunyuan 3D.","status":"active","release_date":"2025-03-20","model_type":"other","page_url":"https://fal.run/fal-ai/hunyuan3d/v2","tagline":"Generate 3D models from your images using Hunyuan 3D.","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/hunyuan3d-v3/image-to-3d","name":"Hunyuan3d V3","created_by":"fal","source":"official","description":"Transform your 
photos into ultra-high-resolution 3D models in seconds.","status":"active","release_date":"2025-12-16","model_type":"other","page_url":"https://fal.run/fal-ai/hunyuan3d-v3/image-to-3d","tagline":"Transform your photos into ultra-high-resolution 3D models in seconds.","capabilities":{"vision":true},"last_seen_at":"2026-06-02","last_updated":"2026-06-03"},{"id":"fal-ai/hunyuan3d-v3/sketch-to-3d","name":"Hunyuan3d V3","created_by":"fal","source":"official","description":"Create your imagined 3D models with just text.","status":"active","release_date":"2025-12-16","model_type":"other","page_url":"https://fal.run/fal-ai/hunyuan3d-v3/sketch-to-3d","tagline":"Create your imagined 3D models with just text.","capabilities":{"vision":true},"last_seen_at":"2026-06-02","last_updated":"2026-06-03"},{"id":"fal-ai/hunyuan3d-v3/text-to-3d","name":"Hunyuan3d V3","created_by":"fal","source":"official","description":"Turn simple sketches into detailed, fully-textured 3D models.","status":"active","release_date":"2025-12-16","model_type":"other","page_url":"https://fal.run/fal-ai/hunyuan3d-v3/text-to-3d","tagline":"Turn simple sketches into detailed, fully-textured 3D models.","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/hunyuan_world/image-to-world","name":"Hunyuan World","created_by":"fal","source":"official","description":"Hunyuan World 1.0 turns a single image into a panorama or a 3D world.","status":"active","release_date":"2025-07-28","model_type":"other","page_url":"https://fal.run/fal-ai/hunyuan_world/image-to-world","tagline":"Hunyuan World 1.0 turns a single image into a panorama or a 3D world.","capabilities":{"vision":true},"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/hunyuan_world","name":"Hunyuan World","created_by":"fal","source":"official","description":"Hunyuan World 1.0 turns a single image into a panorama or a 3D 
world.","status":"active","release_date":"2025-07-28","model_type":"image","page_url":"https://fal.run/fal-ai/hunyuan_world","tagline":"Hunyuan World 1.0 turns a single image into a panorama or a 3D world.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/hy-wu-edit","name":"Hy Wu Edit","created_by":"fal","source":"official","description":"Image editing with HY-WU.","status":"active","release_date":"2026-03-25","model_type":"image","page_url":"https://fal.run/fal-ai/hy-wu-edit","tagline":"Image editing with HY-WU.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-05-07","last_updated":"2026-05-11"},{"id":"fal-ai/hyper-sdxl/image-to-image","name":"Hyper SDXL","created_by":"fal","source":"official","description":"Hyper-charge SDXL's performance and creativity.","status":"active","release_date":"2024-04-25","model_type":"image","page_url":"https://fal.run/fal-ai/hyper-sdxl/image-to-image","tagline":"Hyper-charge SDXL's performance and creativity.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/hyper-sdxl/inpainting","name":"Hyper SDXL","created_by":"fal","source":"official","description":"Hyper-charge SDXL's performance and creativity.","status":"active","release_date":"2024-04-25","model_type":"image","page_url":"https://fal.run/fal-ai/hyper-sdxl/inpainting","tagline":"Hyper-charge SDXL's performance and creativity.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/hyper-sdxl","name":"Hyper SDXL","created_by":"fal","source":"official","description":"Hyper-charge SDXL's performance and 
creativity.","status":"active","release_date":"2024-02-21","model_type":"image","page_url":"https://fal.run/fal-ai/hyper-sdxl","tagline":"Hyper-charge SDXL's performance and creativity.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/hyper3d/rodin/v2.5/fast","name":"Hyper3D - Rodin V2.5 - Image to 3D - Fast","created_by":"fal","source":"official","description":"Rodin V2.5 by Hyper3D generates realistic and production ready 3D models from text or images.","status":"active","release_date":"2026-06-05","model_type":"other","page_url":"https://fal.run/fal-ai/hyper3d/rodin/v2.5/fast","tagline":"Rodin V2.5 by Hyper3D generates realistic and production ready 3D models from text or images.","capabilities":{"vision":true},"last_seen_at":"2026-06-29","last_updated":"2026-06-30"},{"id":"fal-ai/hyper3d/rodin/v2.5/text-to-3d/fast","name":"Hyper3D - Rodin V2.5 - Text to 3D - Fast","created_by":"fal","source":"official","description":"Rodin V2.5 by Hyper3D generates realistic and production ready 3D models from text or images.","status":"active","release_date":"2026-06-05","model_type":"other","page_url":"https://fal.run/fal-ai/hyper3d/rodin/v2.5/text-to-3d/fast","tagline":"Rodin V2.5 by Hyper3D generates realistic and production ready 3D models from text or images.","capabilities":{"vision":true},"last_seen_at":"2026-06-29","last_updated":"2026-06-30"},{"id":"fal-ai/hyper3d/rodin/v2.5/text-to-3d","name":"Hyper3D - Rodin V2.5 - Text to 3D","created_by":"fal","source":"official","description":"Rodin V2.5 by Hyper3D generates realistic and production ready 3D models from text or images.","status":"active","release_date":"2026-05-28","model_type":"other","page_url":"https://fal.run/fal-ai/hyper3d/rodin/v2.5/text-to-3d","tagline":"Rodin V2.5 by Hyper3D generates realistic and production ready 3D models from text or 
images.","capabilities":{"vision":true},"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/hyper3d/rodin/v2.5","name":"Hyper3D - Rodin V2.5 - Image to 3D","created_by":"fal","source":"official","description":"Rodin V2.5 by Hyper3D generates realistic and production ready 3D models from text or images.","status":"active","release_date":"2026-05-28","model_type":"other","page_url":"https://fal.run/fal-ai/hyper3d/rodin/v2.5","tagline":"Rodin V2.5 by Hyper3D generates realistic and production ready 3D models from text or images.","capabilities":{"vision":true},"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/hyper3d/rodin/v2","name":"Hyper3d","created_by":"fal","source":"official","description":"Rodin by Hyper3D generates realistic and production ready 3D models from text or images.","status":"active","release_date":"2025-09-26","model_type":"other","page_url":"https://fal.run/fal-ai/hyper3d/rodin/v2","tagline":"Rodin by Hyper3D generates realistic and production ready 3D models from text or images.","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/hyper3d/rodin","name":"Hyper3D Rodin","created_by":"fal","source":"official","description":"Rodin by Hyper3D generates realistic and production ready 3D models from text or images.","status":"active","release_date":"2024-12-16","model_type":"other","page_url":"https://fal.run/fal-ai/hyper3d/rodin","tagline":"Rodin by Hyper3D generates realistic and production ready 3D models from text or images.","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/iclight-v2","name":"IC-Light-v2 for Image Relighting","created_by":"fal","source":"official","description":"An endpoint for re-lighting photos and changing their backgrounds per a given description","status":"active","release_date":"2024-11-14","model_type":"image","page_url":"https://fal.run/fal-ai/iclight-v2","tagline":"An endpoint for 
re-lighting photos and changing their backgrounds per a given description","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/ideogram/character/edit","name":"Ideogram V3 Character Edit","created_by":"fal","source":"official","description":"Modify consistent characters while preserving their core identity.","status":"active","release_date":"2025-08-07","model_type":"image","page_url":"https://fal.run/fal-ai/ideogram/character/edit","tagline":"Modify consistent characters while preserving their core identity.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/ideogram/character/remix","name":"Ideogram V3 Character Remix","created_by":"fal","source":"official","description":"Transform your consistent character into different art styles, settings, or scenarios while maintaining their distinctive appearance and identity","status":"active","release_date":"2025-08-07","model_type":"image","page_url":"https://fal.run/fal-ai/ideogram/character/remix","tagline":"Transform your consistent character into different art styles, settings, or scenarios while maintaining their distinctive appearance and identity","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/ideogram/character","name":"Ideogram V3 Character","created_by":"fal","source":"official","description":"Generate consistent character appearances across multiple images.","status":"active","release_date":"2025-08-07","model_type":"image","page_url":"https://fal.run/fal-ai/ideogram/character","tagline":"Generate consistent character appearances across multiple 
images.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/ideogram/custom-models/generate","name":"Ideogram","created_by":"fal","source":"official","description":"Train Ideogram on your photos, your style, your subject, your look, from a small set of reference images to images that feel consistently yours ","status":"active","release_date":"2026-04-22","model_type":"image","page_url":"https://fal.run/fal-ai/ideogram/custom-models/generate","tagline":"Train Ideogram on your photos, your style, your subject, your look, from a small set of reference images to images that feel consistently yours ","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/ideogram/custom-models","name":"Ideogram","created_by":"fal","source":"official","description":"Train Ideogram on your photos, your style, your subject, your look, from a small set of reference images to images that feel consistently yours ","status":"active","release_date":"2026-04-22","model_type":"other","page_url":"https://fal.run/fal-ai/ideogram/custom-models","tagline":"Train Ideogram on your photos, your style, your subject, your look, from a small set of reference images to images that feel consistently yours ","capabilities":{"vision":true},"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/ideogram/remove-background","name":"Ideogram Remove Background","created_by":"fal","source":"official","description":"Remove backgrounds from existing images with Ideogram's remove background feature.","status":"active","release_date":"2026-05-07","model_type":"image","page_url":"https://fal.run/fal-ai/ideogram/remove-background","tagline":"Remove backgrounds from existing images with Ideogram's remove background 
feature.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-05-13","last_updated":"2026-06-03"},{"id":"fal-ai/ideogram/upscale","name":"Ideogram Upscale","created_by":"fal","source":"official","description":"Ideogram Upscale enhances the resolution of the reference image by up to 2X and might enhance the reference image too.","status":"active","release_date":"2025-02-10","model_type":"image","page_url":"https://fal.run/fal-ai/ideogram/upscale","tagline":"Ideogram Upscale enhances the resolution of the reference image by up to 2X and might enhance the reference image too.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/ideogram/v2/edit","name":"Ideogram V2 Edit","created_by":"fal","source":"official","description":"Transform existing images with Ideogram V2's editing capabilities.","status":"active","release_date":"2024-12-14","model_type":"image","page_url":"https://fal.run/fal-ai/ideogram/v2/edit","tagline":"Transform existing images with Ideogram V2's editing capabilities.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/ideogram/v2/remix","name":"Ideogram V2 Remix","created_by":"fal","source":"official","description":"Reimagine existing images with Ideogram V2's remix feature.","status":"active","release_date":"2024-12-04","model_type":"image","page_url":"https://fal.run/fal-ai/ideogram/v2/remix","tagline":"Reimagine existing images with Ideogram V2's remix feature.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/ideogram/v2/turbo/edit","name":"Ideogram V2 Turbo 
Edit","created_by":"fal","source":"official","description":"Edit images faster with Ideogram V2 Turbo.","status":"active","release_date":"2024-12-04","model_type":"image","page_url":"https://fal.run/fal-ai/ideogram/v2/turbo/edit","tagline":"Edit images faster with Ideogram V2 Turbo.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/ideogram/v2/turbo/remix","name":"Ideogram V2 Turbo Remix","created_by":"fal","source":"official","description":"Rapidly create image variations with Ideogram V2 Turbo Remix.","status":"active","release_date":"2024-12-04","model_type":"image","page_url":"https://fal.run/fal-ai/ideogram/v2/turbo/remix","tagline":"Rapidly create image variations with Ideogram V2 Turbo Remix.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/ideogram/v2/turbo","name":"Ideogram V2 Turbo","created_by":"fal","source":"official","description":"Accelerated image generation with Ideogram V2 Turbo.","status":"active","release_date":"2024-12-04","model_type":"image","page_url":"https://fal.run/fal-ai/ideogram/v2/turbo","tagline":"Accelerated image generation with Ideogram V2 Turbo.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/ideogram/v2","name":"Ideogram V2","created_by":"fal","source":"official","description":"Generate high-quality images, posters, and logos with Ideogram V2.","status":"active","release_date":"2024-12-04","model_type":"image","page_url":"https://fal.run/fal-ai/ideogram/v2","tagline":"Generate high-quality images, posters, and logos with Ideogram 
V2.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/ideogram/v2a/remix","name":"Ideogram V2A Remix","created_by":"fal","source":"official","description":"Create variations of existing images with Ideogram V2A Remix while maintaining creative control through prompt guidance.","status":"active","release_date":"2025-02-27","model_type":"image","page_url":"https://fal.run/fal-ai/ideogram/v2a/remix","tagline":"Create variations of existing images with Ideogram V2A Remix while maintaining creative control through prompt guidance.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/ideogram/v2a/turbo/remix","name":"Ideogram V2A Turbo Remix","created_by":"fal","source":"official","description":"Rapidly create image variations with Ideogram V2A Turbo Remix.","status":"active","release_date":"2025-02-27","model_type":"image","page_url":"https://fal.run/fal-ai/ideogram/v2a/turbo/remix","tagline":"Rapidly create image variations with Ideogram V2A Turbo Remix.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/ideogram/v2a/turbo","name":"Ideogram V2A Turbo","created_by":"fal","source":"official","description":"Accelerated image generation with Ideogram V2A Turbo.","status":"active","release_date":"2025-02-27","model_type":"image","page_url":"https://fal.run/fal-ai/ideogram/v2a/turbo","tagline":"Accelerated image generation with Ideogram V2A Turbo.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/ideogram/v2a","name":"Ideogram 
V2A","created_by":"fal","source":"official","description":"Generate high-quality images, posters, and logos with Ideogram V2A.","status":"active","release_date":"2025-02-27","model_type":"image","page_url":"https://fal.run/fal-ai/ideogram/v2a","tagline":"Generate high-quality images, posters, and logos with Ideogram V2A.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/ideogram/v3/edit","name":"Ideogram V3 Edit","created_by":"fal","source":"official","description":"Transform existing images with Ideogram V3's editing capabilities.","status":"active","release_date":"2025-05-01","model_type":"image","page_url":"https://fal.run/fal-ai/ideogram/v3/edit","tagline":"Transform existing images with Ideogram V3's editing capabilities.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/ideogram/v3/generate-transparent","name":"Ideogram Transparent","created_by":"fal","source":"official","description":"Generate images with transparent backgrounds using Ideogram Transparent model","status":"active","release_date":"2026-04-07","model_type":"image","page_url":"https://fal.run/fal-ai/ideogram/v3/generate-transparent","tagline":"Generate images with transparent backgrounds using Ideogram Transparent model","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/ideogram/v3/layerize-text","name":"Ideogram","created_by":"fal","source":"official","description":"Ideogram Layerize takes an existing flat graphic, removes text, and returns structured text containers you can edit/recompose in html or json 
format.","status":"active","release_date":"2026-04-07","model_type":"image","page_url":"https://fal.run/fal-ai/ideogram/v3/layerize-text","tagline":"Ideogram Layerize takes an existing flat graphic, removes text, and returns structured text containers you can edit/recompose in html or json format.","capabilities":{"vision":true,"structured_output":true,"json_mode":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/ideogram/v3/reframe","name":"Ideogram","created_by":"fal","source":"official","description":"Extend existing images with Ideogram V3's reframe feature.","status":"active","release_date":"2025-05-01","model_type":"image","page_url":"https://fal.run/fal-ai/ideogram/v3/reframe","tagline":"Extend existing images with Ideogram V3's reframe feature.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/ideogram/v3/remix","name":"Ideogram","created_by":"fal","source":"official","description":"Reimagine existing images with Ideogram V3's remix feature.","status":"active","release_date":"2025-05-01","model_type":"image","page_url":"https://fal.run/fal-ai/ideogram/v3/remix","tagline":"Reimagine existing images with Ideogram V3's remix feature.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/ideogram/v3/replace-background","name":"Ideogram Replace Background","created_by":"fal","source":"official","description":"Replace backgrounds existing images with Ideogram V3's replace background feature.","status":"active","release_date":"2025-05-01","model_type":"image","page_url":"https://fal.run/fal-ai/ideogram/v3/replace-background","tagline":"Replace backgrounds existing images with Ideogram V3's 
replace background feature.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/ideogram/v3","name":"Ideogram Text to Image","created_by":"fal","source":"official","description":"Generate high-quality images, posters, and logos with Ideogram V3.","status":"active","release_date":"2025-05-01","model_type":"image","page_url":"https://fal.run/fal-ai/ideogram/v3","tagline":"Generate high-quality images, posters, and logos with Ideogram V3.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/illusion-diffusion","name":"Illusion Diffusion","created_by":"fal","source":"official","description":"Create illusions conditioned on image.","status":"active","release_date":"2024-02-13","model_type":"image","page_url":"https://fal.run/fal-ai/illusion-diffusion","tagline":"Create illusions conditioned on image.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/image-apps-v2/age-modify","name":"Age Modify","created_by":"fal","source":"official","description":"Modify a face to look younger or older while keeping identity realistic.","status":"active","release_date":"2025-09-18","model_type":"image","page_url":"https://fal.run/fal-ai/image-apps-v2/age-modify","tagline":"Modify a face to look younger or older while keeping identity realistic.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/image-apps-v2/city-teleport","name":"City Teleport","created_by":"fal","source":"official","description":"Place a person’s photo into iconic cities 
worldwide.","status":"active","release_date":"2025-09-18","model_type":"image","page_url":"https://fal.run/fal-ai/image-apps-v2/city-teleport","tagline":"Place a person’s photo into iconic cities worldwide.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/image-apps-v2/expression-change","name":"Expression Change","created_by":"fal","source":"official","description":"Change facial expressions in photos with realistic results.","status":"active","release_date":"2025-09-18","model_type":"image","page_url":"https://fal.run/fal-ai/image-apps-v2/expression-change","tagline":"Change facial expressions in photos with realistic results.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/image-apps-v2/hair-change","name":"Hair Change","created_by":"fal","source":"official","description":"Change hairstyles and hair colors in photos realistically.","status":"active","release_date":"2025-09-18","model_type":"image","page_url":"https://fal.run/fal-ai/image-apps-v2/hair-change","tagline":"Change hairstyles and hair colors in photos realistically.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/image-apps-v2/headshot-photo","name":"Headshot Generator","created_by":"fal","source":"official","description":"Generate professional headshot photos with customizable backgrounds.","status":"active","release_date":"2025-09-18","model_type":"image","page_url":"https://fal.run/fal-ai/image-apps-v2/headshot-photo","tagline":"Generate professional headshot photos with customizable 
backgrounds.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/image-apps-v2/makeup-application","name":"Makeup Changer","created_by":"fal","source":"official","description":"Apply realistic makeup styles with adjustable intensity.","status":"active","release_date":"2025-09-18","model_type":"image","page_url":"https://fal.run/fal-ai/image-apps-v2/makeup-application","tagline":"Apply realistic makeup styles with adjustable intensity.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/image-apps-v2/object-removal","name":"Object Removal","created_by":"fal","source":"official","description":"Remove unwanted objects seamlessly from any image.","status":"active","release_date":"2025-09-18","model_type":"image","page_url":"https://fal.run/fal-ai/image-apps-v2/object-removal","tagline":"Remove unwanted objects seamlessly from any image.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/image-apps-v2/outpaint","name":"Image Outpaint","created_by":"fal","source":"official","description":"Directional outpainting.","status":"active","release_date":"2025-11-03","model_type":"image","page_url":"https://fal.run/fal-ai/image-apps-v2/outpaint","tagline":"Directional outpainting.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/image-apps-v2/perspective","name":"Perspective Change","created_by":"fal","source":"official","description":"Easily adjust the perspective of any image to different 
angles.","status":"active","release_date":"2025-09-18","model_type":"image","page_url":"https://fal.run/fal-ai/image-apps-v2/perspective","tagline":"Easily adjust the perspective of any image to different angles.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/image-apps-v2/photo-restoration","name":"Photo Restoration","created_by":"fal","source":"official","description":"Restore old or damaged photos by fixing colors, scratches, and resolution.","status":"active","release_date":"2025-09-18","model_type":"image","page_url":"https://fal.run/fal-ai/image-apps-v2/photo-restoration","tagline":"Restore old or damaged photos by fixing colors, scratches, and resolution.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/image-apps-v2/photography-effects","name":"Photography Effects","created_by":"fal","source":"official","description":"Apply diverse photography styles and effects to transform your images.","status":"active","release_date":"2025-09-18","model_type":"image","page_url":"https://fal.run/fal-ai/image-apps-v2/photography-effects","tagline":"Apply diverse photography styles and effects to transform your images.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/image-apps-v2/portrait-enhance","name":"Portrait Enhance","created_by":"fal","source":"official","description":"Enhance and refine portrait photos with improved clarity and detail.","status":"active","release_date":"2025-09-18","model_type":"image","page_url":"https://fal.run/fal-ai/image-apps-v2/portrait-enhance","tagline":"Enhance and refine portrait photos with improved clarity and 
detail.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/image-apps-v2/product-holding","name":"Product Holding","created_by":"fal","source":"official","description":"Place products naturally in a person’s hands for realistic marketing visuals.","status":"active","release_date":"2025-09-19","model_type":"image","page_url":"https://fal.run/fal-ai/image-apps-v2/product-holding","tagline":"Place products naturally in a person’s hands for realistic marketing visuals.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/image-apps-v2/product-photography","name":"Product Photography","created_by":"fal","source":"official","description":"Generate professional product photography with realistic lighting and backgrounds.","status":"active","release_date":"2025-09-19","model_type":"image","page_url":"https://fal.run/fal-ai/image-apps-v2/product-photography","tagline":"Generate professional product photography with realistic lighting and backgrounds.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/image-apps-v2/relighting","name":"Relighting","created_by":"fal","source":"official","description":"Adjust and enhance images with different lighting styles.","status":"active","release_date":"2025-09-18","model_type":"image","page_url":"https://fal.run/fal-ai/image-apps-v2/relighting","tagline":"Adjust and enhance images with different lighting styles.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/image-apps-v2/style-transfer","name":"Style 
Transfer","created_by":"fal","source":"official","description":"Apply artistic styles like impressionism, cubism, or surrealism to your images.","status":"active","release_date":"2025-09-18","model_type":"image","page_url":"https://fal.run/fal-ai/image-apps-v2/style-transfer","tagline":"Apply artistic styles like impressionism, cubism, or surrealism to your images.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/image-apps-v2/texture-transform","name":"Texture Transform","created_by":"fal","source":"official","description":"Transform objects with different surface textures like marble, wood, or fabric.","status":"active","release_date":"2025-09-18","model_type":"image","page_url":"https://fal.run/fal-ai/image-apps-v2/texture-transform","tagline":"Transform objects with different surface textures like marble, wood, or fabric.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/image-apps-v2/virtual-try-on","name":"Virtual Try-on","created_by":"fal","source":"official","description":"Try on clothes virtually by combining person and clothing images.","status":"active","release_date":"2025-09-18","model_type":"image","page_url":"https://fal.run/fal-ai/image-apps-v2/virtual-try-on","tagline":"Try on clothes virtually by combining person and clothing images.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/image-editing/age-progression","name":"Image Editing Age Progression","created_by":"fal","source":"official","description":"See how you or others might look at different ages, from younger to older, while preserving core facial 
features.","status":"active","release_date":"2025-05-29","model_type":"image","page_url":"https://fal.run/fal-ai/image-editing/age-progression","tagline":"See how you or others might look at different ages, from younger to older, while preserving core facial features.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/image-editing/baby-version","name":"Image Editing","created_by":"fal","source":"official","description":"Transform any person into their baby version, while preserving the original pose and expression with childlike features.","status":"active","release_date":"2025-06-03","model_type":"image","page_url":"https://fal.run/fal-ai/image-editing/baby-version","tagline":"Transform any person into their baby version, while preserving the original pose and expression with childlike features.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/image-editing/background-change","name":"Image Editing Background Change","created_by":"fal","source":"official","description":"Replace your photo's background with any scene you desire, from beach sunsets to urban landscapes, with perfect lighting and shadows","status":"active","release_date":"2025-05-29","model_type":"image","page_url":"https://fal.run/fal-ai/image-editing/background-change","tagline":"Replace your photo's background with any scene you desire, from beach sunsets to urban landscapes, with perfect lighting and shadows","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/image-editing/broccoli-haircut","name":"Image Editing Broccoli Haircut","created_by":"fal","source":"official","description":"Transform your 
character's hair into broccoli style while keeping the original characters likeness","status":"active","release_date":"2025-06-26","model_type":"image","page_url":"https://fal.run/fal-ai/image-editing/broccoli-haircut","tagline":"Transform your character's hair into broccoli style while keeping the original characters likeness","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/image-editing/cartoonify","name":"Image Editing Cartoonify","created_by":"fal","source":"official","description":"Transform your photos into vibrant cool cartoons with bold outlines and rich colors.","status":"active","release_date":"2025-05-29","model_type":"image","page_url":"https://fal.run/fal-ai/image-editing/cartoonify","tagline":"Transform your photos into vibrant cool cartoons with bold outlines and rich colors.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/image-editing/color-correction","name":"Image Editing Color Correction","created_by":"fal","source":"official","description":"Perfect your photos with professional color grading, balanced tones, and vibrant yet natural colors","status":"active","release_date":"2025-05-29","model_type":"image","page_url":"https://fal.run/fal-ai/image-editing/color-correction","tagline":"Perfect your photos with professional color grading, balanced tones, and vibrant yet natural colors","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/image-editing/expression-change","name":"Image Editing Expression Change","created_by":"fal","source":"official","description":"Change facial expressions in photos to any emotion you desire, from smiles to serious 
looks.","status":"active","release_date":"2025-05-29","model_type":"image","page_url":"https://fal.run/fal-ai/image-editing/expression-change","tagline":"Change facial expressions in photos to any emotion you desire, from smiles to serious looks.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/image-editing/face-enhancement","name":"Image Editing Face Enhancement","created_by":"fal","source":"official","description":"Enhance facial features with professional retouching while maintaining a natural, realistic look","status":"active","release_date":"2025-05-29","model_type":"image","page_url":"https://fal.run/fal-ai/image-editing/face-enhancement","tagline":"Enhance facial features with professional retouching while maintaining a natural, realistic look","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/image-editing/hair-change","name":"Image Editing Hair Change","created_by":"fal","source":"official","description":"Experiment with different hairstyles, from bald to any style you can imagine, while maintaining natural lighting and realistic results.","status":"active","release_date":"2025-05-29","model_type":"image","page_url":"https://fal.run/fal-ai/image-editing/hair-change","tagline":"Experiment with different hairstyles, from bald to any style you can imagine, while maintaining natural lighting and realistic results.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/image-editing/object-removal","name":"Image Editing Object Removal","created_by":"fal","source":"official","description":"Remove unwanted objects or people from your photos while seamlessly blending the 
background.","status":"active","release_date":"2025-05-29","model_type":"image","page_url":"https://fal.run/fal-ai/image-editing/object-removal","tagline":"Remove unwanted objects or people from your photos while seamlessly blending the background.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-01","last_updated":"2026-06-03"},{"id":"fal-ai/image-editing/photo-restoration","name":"Image Editing Photo Restoration","created_by":"fal","source":"official","description":"Restore and enhance old or damaged photos by removing imperfections, adding color while preserving the original character and details of the image.","status":"active","release_date":"2025-06-02","model_type":"image","page_url":"https://fal.run/fal-ai/image-editing/photo-restoration","tagline":"Restore and enhance old or damaged photos by removing imperfections, adding color while preserving the original character and details of the image.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/image-editing/plushie-style","name":"Image Editing Plushie Style","created_by":"fal","source":"official","description":"Transform your photos into cool plushies while keeping the original characters likeness","status":"active","release_date":"2025-06-26","model_type":"image","page_url":"https://fal.run/fal-ai/image-editing/plushie-style","tagline":"Transform your photos into cool plushies while keeping the original characters likeness","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/image-editing/professional-photo","name":"Image Editing Professional Photo","created_by":"fal","source":"official","description":"Turn your casual photos into stunning professional 
studio portraits with perfect lighting and high-end photography style.","status":"active","release_date":"2025-05-29","model_type":"image","page_url":"https://fal.run/fal-ai/image-editing/professional-photo","tagline":"Turn your casual photos into stunning professional studio portraits with perfect lighting and high-end photography style.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/image-editing/realism","name":"Image Editing Realism","created_by":"fal","source":"official","description":"Add details to faces, enhance face features, remove blur.","status":"active","release_date":"2025-07-07","model_type":"image","page_url":"https://fal.run/fal-ai/image-editing/realism","tagline":"Add details to faces, enhance face features, remove blur.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/image-editing/reframe","name":"Image Editing Reframe","created_by":"fal","source":"official","description":"The reframe endpoint intelligently adjusts an image's aspect ratio while preserving the main subject's position, composition, pose, and perspective","status":"active","release_date":"2025-06-05","model_type":"image","page_url":"https://fal.run/fal-ai/image-editing/reframe","tagline":"The reframe endpoint intelligently adjusts an image's aspect ratio while preserving the main subject's position, composition, pose, and perspective","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/image-editing/retouch","name":"Image Editing Retouch","created_by":"fal","source":"official","description":"Retouch photos of 
faces.","status":"active","release_date":"2025-07-24","model_type":"image","page_url":"https://fal.run/fal-ai/image-editing/retouch","tagline":"Retouch photos of faces.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/image-editing/scene-composition","name":"Image Editing Scene Composition","created_by":"fal","source":"official","description":"Place your subject in any scene you imagine, from enchanted forests to urban settings, with professional composition and lighting","status":"active","release_date":"2025-05-29","model_type":"image","page_url":"https://fal.run/fal-ai/image-editing/scene-composition","tagline":"Place your subject in any scene you imagine, from enchanted forests to urban settings, with professional composition and lighting","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/image-editing/style-transfer","name":"Image Editing Style Transfer","created_by":"fal","source":"official","description":"Transform your photos into artistic masterpieces inspired by famous styles like Van Gogh's Starry Night or any artistic style you choose.","status":"active","release_date":"2025-05-29","model_type":"image","page_url":"https://fal.run/fal-ai/image-editing/style-transfer","tagline":"Transform your photos into artistic masterpieces inspired by famous styles like Van Gogh's Starry Night or any artistic style you choose.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/image-editing/text-removal","name":"Image Editing Text Removal","created_by":"fal","source":"official","description":"Remove all text and writing from images while preserving the background and 
natural appearance.","status":"active","release_date":"2025-06-02","model_type":"image","page_url":"https://fal.run/fal-ai/image-editing/text-removal","tagline":"Remove all text and writing from images while preserving the background and natural appearance.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/image-editing/time-of-day","name":"Image Editing Time Of Day","created_by":"fal","source":"official","description":"Transform your photos to any time of day, from golden hour to midnight, with appropriate lighting and atmosphere.","status":"active","release_date":"2025-05-29","model_type":"image","page_url":"https://fal.run/fal-ai/image-editing/time-of-day","tagline":"Transform your photos to any time of day, from golden hour to midnight, with appropriate lighting and atmosphere.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/image-editing/weather-effect","name":"Image Editing Weather Effect","created_by":"fal","source":"official","description":"Add realistic weather effects like snowfall, rain, or fog to your photos while maintaining the scene's mood.","status":"active","release_date":"2025-05-29","model_type":"image","page_url":"https://fal.run/fal-ai/image-editing/weather-effect","tagline":"Add realistic weather effects like snowfall, rain, or fog to your photos while maintaining the scene's mood.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/image-editing/wojak-style","name":"Image Editing Wojak Style","created_by":"fal","source":"official","description":"Transform your photos into wojak style while keeping the original characters 
likeness","status":"active","release_date":"2025-06-26","model_type":"image","page_url":"https://fal.run/fal-ai/image-editing/wojak-style","tagline":"Transform your photos into wojak style while keeping the original characters likeness","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/image-editing/youtube-thumbnails","name":"Image Editing Youtube Thumbnails","created_by":"fal","source":"official","description":"Generate YouTube thumbnails with custom text","status":"active","release_date":"2025-06-30","model_type":"image","page_url":"https://fal.run/fal-ai/image-editing/youtube-thumbnails","tagline":"Generate YouTube thumbnails with custom text","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/image-preprocessors/depth-anything/v2","name":"Image Preprocessors","created_by":"fal","source":"official","description":"Depth Anything v2 preprocessor.","status":"active","release_date":"2024-09-16","model_type":"image","page_url":"https://fal.run/fal-ai/image-preprocessors/depth-anything/v2","tagline":"Depth Anything v2 preprocessor.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/image-preprocessors/hed","name":"Image Preprocessors","created_by":"fal","source":"official","description":"Holistically-Nested Edge Detection (HED) preprocessor.","status":"active","release_date":"2024-09-16","model_type":"image","page_url":"https://fal.run/fal-ai/image-preprocessors/hed","tagline":"Holistically-Nested Edge Detection (HED) 
preprocessor.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/image-preprocessors/lineart","name":"Image Preprocessors","created_by":"fal","source":"official","description":"Line art preprocessor.","status":"active","release_date":"2024-09-16","model_type":"image","page_url":"https://fal.run/fal-ai/image-preprocessors/lineart","tagline":"Line art preprocessor.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/image-preprocessors/midas","name":"Image Preprocessors","created_by":"fal","source":"official","description":"MiDaS depth estimation preprocessor.","status":"active","release_date":"2024-09-16","model_type":"image","page_url":"https://fal.run/fal-ai/image-preprocessors/midas","tagline":"MiDaS depth estimation preprocessor.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/image-preprocessors/mlsd","name":"Image Preprocessors","created_by":"fal","source":"official","description":"M-LSD line segment detection preprocessor.","status":"active","release_date":"2024-09-16","model_type":"image","page_url":"https://fal.run/fal-ai/image-preprocessors/mlsd","tagline":"M-LSD line segment detection preprocessor.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/image-preprocessors/pidi","name":"Image Preprocessors","created_by":"fal","source":"official","description":"PIDI (Pidinet) preprocessor.","status":"active","release_date":"2024-09-16","model_type":"image","page_url":"https://fal.run/fal-ai/image-preprocessors/pidi","tagline":"PIDI 
(Pidinet) preprocessor.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/image-preprocessors/sam","name":"Image Preprocessors","created_by":"fal","source":"official","description":"Segment Anything Model (SAM) preprocessor.","status":"active","release_date":"2024-09-16","model_type":"image","page_url":"https://fal.run/fal-ai/image-preprocessors/sam","tagline":"Segment Anything Model (SAM) preprocessor.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/image-preprocessors/scribble","name":"Image Preprocessors","created_by":"fal","source":"official","description":"Scribble preprocessor.","status":"active","release_date":"2024-09-16","model_type":"image","page_url":"https://fal.run/fal-ai/image-preprocessors/scribble","tagline":"Scribble preprocessor.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/image-preprocessors/teed","name":"Image Preprocessors","created_by":"fal","source":"official","description":"TEED (Temporal Edge Enhancement Detection) preprocessor.","status":"active","release_date":"2024-09-16","model_type":"image","page_url":"https://fal.run/fal-ai/image-preprocessors/teed","tagline":"TEED (Temporal Edge Enhancement Detection) preprocessor.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/image-preprocessors/zoe","name":"Image Preprocessors","created_by":"fal","source":"official","description":"ZoeDepth 
preprocessor.","status":"active","release_date":"2024-09-16","model_type":"image","page_url":"https://fal.run/fal-ai/image-preprocessors/zoe","tagline":"ZoeDepth preprocessor.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/image2pixel","name":"Image2Pixel","created_by":"fal","source":"official","description":"Turn images into pixel-perfect retro art","status":"active","release_date":"2025-10-14","model_type":"image","page_url":"https://fal.run/fal-ai/image2pixel","tagline":"Turn images into pixel-perfect retro art","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/image2svg","name":"Image2svg","created_by":"fal","source":"official","description":"Image2SVG transforms raster images into clean vector graphics, preserving visual quality while enabling scalable, customizable SVG outputs with precise control over detail levels.","status":"active","release_date":"2025-04-25","model_type":"image","page_url":"https://fal.run/fal-ai/image2svg","tagline":"Image2SVG transforms raster images into clean vector graphics, preserving visual quality while enabling scalable, customizable SVG outputs with precise control over detail levels.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/imagen3/fast","name":"Imagen3 Fast","created_by":"fal","source":"official","family":"imagen","description":"Imagen3 Fast is a high-quality text-to-image model that generates realistic images from text prompts.","status":"active","release_date":"2025-02-10","model_type":"image","page_url":"https://fal.run/fal-ai/imagen3/fast","tagline":"Imagen3 Fast is a high-quality text-to-image model that 
generates realistic images from text prompts.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-28","last_updated":"2026-05-11"},{"id":"fal-ai/imagen3","name":"Imagen3","created_by":"fal","source":"official","family":"imagen","description":"Imagen3 is a high-quality text-to-image model that generates realistic images from text prompts.","status":"active","release_date":"2025-02-10","model_type":"image","page_url":"https://fal.run/fal-ai/imagen3","tagline":"Imagen3 is a high-quality text-to-image model that generates realistic images from text prompts.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-28","last_updated":"2026-05-11"},{"id":"fal-ai/imagen4/preview/fast","name":"Imagen 4","created_by":"fal","source":"official","family":"imagen","description":"Google’s highest quality image generation model","status":"active","release_date":"2025-06-12","model_type":"image","page_url":"https://fal.run/fal-ai/imagen4/preview/fast","tagline":"Google’s highest quality image generation model","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-28","last_updated":"2026-05-11"},{"id":"fal-ai/imagen4/preview/ultra","name":"Imagen 4 Ultra","created_by":"fal","source":"official","family":"imagen","description":"Google’s highest quality image generation model","status":"active","release_date":"2025-05-20","model_type":"image","page_url":"https://fal.run/fal-ai/imagen4/preview/ultra","tagline":"Google’s highest quality image generation model","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-28","last_updated":"2026-05-11"},{"id":"fal-ai/imagen4/preview","name":"Imagen 4","created_by":"fal","source":"official","family":"imagen","description":"Google’s highest quality 
image generation model","status":"active","release_date":"2025-05-20","model_type":"image","page_url":"https://fal.run/fal-ai/imagen4/preview","tagline":"Google’s highest quality image generation model","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-28","last_updated":"2026-05-11"},{"id":"fal-ai/imageutils/depth","name":"Midas Depth Estimation","created_by":"fal","source":"official","description":"Create depth maps using Midas depth estimation.","status":"active","release_date":"2024-02-13","model_type":"image","page_url":"https://fal.run/fal-ai/imageutils/depth","tagline":"Create depth maps using Midas depth estimation.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/imageutils/marigold-depth","name":"Marigold Depth Estimation","created_by":"fal","source":"official","description":"Create depth maps using Marigold depth estimation.","status":"active","release_date":"2023-12-28","model_type":"image","page_url":"https://fal.run/fal-ai/imageutils/marigold-depth","tagline":"Create depth maps using Marigold depth estimation.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/imageutils/nsfw","name":"NSFW Filter","created_by":"fal","source":"official","description":"Predict the probability of an image being NSFW.","status":"active","release_date":"2024-03-22","model_type":"other","page_url":"https://fal.run/fal-ai/imageutils/nsfw","tagline":"Predict the probability of an image being NSFW.","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/imageutils/rembg","name":"Remove Background","created_by":"fal","source":"official","description":"Remove the background from an 
image.","status":"active","release_date":"2023-10-05","model_type":"image","page_url":"https://fal.run/fal-ai/imageutils/rembg","tagline":"Remove the background from an image.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/index-tts-2/text-to-speech","name":"Index TTS 2.0","created_by":"fal","source":"official","description":"Generate natural, clear speeches using Index TTS 2.0 from IndexTeam","status":"active","release_date":"2025-10-07","model_type":"tts","page_url":"https://fal.run/fal-ai/index-tts-2/text-to-speech","tagline":"Generate natural, clear speeches using Index TTS 2.0 from IndexTeam","modalities":{"input":["text"],"output":["audio"]},"endpoints":["audio_speech"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/infinitalk/single-text","name":"Infinitalk","created_by":"fal","source":"official","description":"Infinitalk model generates a talking avatar video from a text and audio file.","status":"active","release_date":"2025-08-22","model_type":"video","page_url":"https://fal.run/fal-ai/infinitalk/single-text","tagline":"Infinitalk model generates a talking avatar video from a text and audio file.","modalities":{"input":["text","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/infinitalk/video-to-video","name":"Infinitalk","created_by":"fal","source":"official","description":"Infinitalk model generates a talking avatar video from an image and audio file.","status":"active","release_date":"2025-09-22","model_type":"other","page_url":"https://fal.run/fal-ai/infinitalk/video-to-video","tagline":"Infinitalk model generates a talking avatar video from an image and audio 
file.","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/infinitalk","name":"Infinitalk","created_by":"fal","source":"official","description":"Infinitalk model generates a talking avatar video from an image and audio file.","status":"active","release_date":"2025-08-21","model_type":"other","page_url":"https://fal.run/fal-ai/infinitalk","tagline":"Infinitalk model generates a talking avatar video from an image and audio file.","capabilities":{"vision":true},"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/infinity-star/text-to-video","name":"Infinity Star","created_by":"fal","source":"official","description":"InfinityStar’s unified 8B spacetime autoregressive engine to turn any text prompt into crisp 720p videos - 10× faster than diffusion models.","status":"active","release_date":"2025-11-07","model_type":"video","page_url":"https://fal.run/fal-ai/infinity-star/text-to-video","tagline":"InfinityStar’s unified 8B spacetime autoregressive engine to turn any text prompt into crisp 720p videos - 10× faster than diffusion models.","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/inpaint","name":"Inpainting sdxl and sd","created_by":"fal","source":"official","description":"Inpaint images with SD and SDXL","status":"active","release_date":"2023-11-04","model_type":"image","page_url":"https://fal.run/fal-ai/inpaint","tagline":"Inpaint images with SD and SDXL","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/instant-character","name":"Instant Character","created_by":"fal","source":"official","description":"InstantCharacter creates high-quality, consistent characters from text prompts, supporting diverse poses, styles, and appearances with strong identity 
control.","status":"active","release_date":"2025-04-18","model_type":"image","page_url":"https://fal.run/fal-ai/instant-character","tagline":"InstantCharacter creates high-quality, consistent characters from text prompts, supporting diverse poses, styles, and appearances with strong identity control.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/invisible-watermark","name":"Invisible Watermark","created_by":"fal","source":"official","description":"Invisible Watermark is a model that can add an invisible watermark to an image.","status":"active","release_date":"2025-03-14","model_type":"image","page_url":"https://fal.run/fal-ai/invisible-watermark","tagline":"Invisible Watermark is a model that can add an invisible watermark to an image.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/inworld-tts","name":"Inworld TTS-1.5 Max","created_by":"fal","source":"official","description":"Text to Speech Endpoint for Inworld's TTS-1.5 Max.","status":"active","release_date":"2026-03-13","model_type":"tts","page_url":"https://fal.run/fal-ai/inworld-tts","tagline":"Text to Speech Endpoint for Inworld's TTS-1.5 Max.","modalities":{"input":["text"],"output":["audio"]},"endpoints":["audio_speech"],"last_seen_at":"2026-05-07","last_updated":"2026-05-11"},{"id":"fal-ai/ip-adapter-face-id","name":"IP Adapter Face ID","created_by":"fal","source":"official","description":"High quality zero-shot personalization","status":"active","release_date":"2024-04-22","model_type":"image","page_url":"https://fal.run/fal-ai/ip-adapter-face-id","tagline":"High quality zero-shot 
personalization","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/janus","name":"DeepSeek Janus-Pro","created_by":"fal","source":"official","description":"DeepSeek Janus-Pro is a novel text-to-image model that unifies multimodal understanding and generation through an autoregressive framework","status":"active","release_date":"2025-01-28","model_type":"image","page_url":"https://fal.run/fal-ai/janus","tagline":"DeepSeek Janus-Pro is a novel text-to-image model that unifies multimodal understanding and generation through an autoregressive framework","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/joyai-image-edit","name":"Joyai Image Edit","created_by":"fal","source":"official","description":"All-in-one image AI with JoyAI-Image.","status":"active","release_date":"2026-04-06","model_type":"image","page_url":"https://fal.run/fal-ai/joyai-image-edit","tagline":"All-in-one image AI with JoyAI-Image.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-05-07","last_updated":"2026-05-11"},{"id":"fal-ai/kandinsky5-pro/image-to-video","name":"Kandinsky5 Pro","created_by":"fal","source":"official","description":"Kandinsky 5.0 Pro is a diffusion model for fast, high-quality image-to-video generation.","status":"active","release_date":"2025-12-23","model_type":"video","page_url":"https://fal.run/fal-ai/kandinsky5-pro/image-to-video","tagline":"Kandinsky 5.0 Pro is a diffusion model for fast, high-quality image-to-video 
generation.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/kandinsky5-pro/text-to-video","name":"Kandinsky5 Pro","created_by":"fal","source":"official","description":"Kandinsky 5.0 Pro is a diffusion model for fast, high-quality text-to-video generation.","status":"active","release_date":"2025-12-23","model_type":"video","page_url":"https://fal.run/fal-ai/kandinsky5-pro/text-to-video","tagline":"Kandinsky 5.0 Pro is a diffusion model for fast, high-quality text-to-video generation.","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/kandinsky5/text-to-video/distill","name":"Kandinsky5","created_by":"fal","source":"official","description":"Kandinsky 5.0 Distilled is a lightweight diffusion model for fast, high-quality text-to-video generation.","status":"active","release_date":"2025-10-13","model_type":"video","page_url":"https://fal.run/fal-ai/kandinsky5/text-to-video/distill","tagline":"Kandinsky 5.0 Distilled is a lightweight diffusion model for fast, high-quality text-to-video generation.","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/kandinsky5/text-to-video","name":"Kandinsky5","created_by":"fal","source":"official","description":"Kandinsky 5.0 is a diffusion model for fast, high-quality text-to-video generation.","status":"active","release_date":"2025-10-13","model_type":"video","page_url":"https://fal.run/fal-ai/kandinsky5/text-to-video","tagline":"Kandinsky 5.0 is a diffusion model for fast, high-quality text-to-video generation.","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/kling-image/o1","name":"Kling O1 
Image","created_by":"fal","source":"official","description":"Perform precise image edits using strong reference control, transforming subjects, styles, and local details while preserving visual consistency.","status":"active","release_date":"2025-12-01","model_type":"image","page_url":"https://fal.run/fal-ai/kling-image/o1","tagline":"Perform precise image edits using strong reference control, transforming subjects, styles, and local details while preserving visual consistency.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/kling-image/o3/image-to-image","name":"Kling Image","created_by":"fal","source":"official","description":"Kling Omni 3: Top-tier image-to-image with flawless consistency.","status":"active","release_date":"2026-02-03","model_type":"image","page_url":"https://fal.run/fal-ai/kling-image/o3/image-to-image","tagline":"Kling Omni 3: Top-tier image-to-image with flawless consistency.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/kling-image/o3/text-to-image","name":"Kling Image","created_by":"fal","source":"official","description":"Kling Omni 3: Top-tier text-to-image with flawless consistency.","status":"active","release_date":"2026-02-03","model_type":"image","page_url":"https://fal.run/fal-ai/kling-image/o3/text-to-image","tagline":"Kling Omni 3: Top-tier text-to-image with flawless consistency.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/kling-image/v3/image-to-image","name":"Kling Image","created_by":"fal","source":"official","description":"Kling Image V3: Latest kling image 
model","status":"active","release_date":"2026-02-03","model_type":"image","page_url":"https://fal.run/fal-ai/kling-image/v3/image-to-image","tagline":"Kling Image V3: Latest kling image model","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/kling-image/v3/text-to-image","name":"Kling Image","created_by":"fal","source":"official","description":"Kling V3: Latest Kling Image model","status":"active","release_date":"2026-02-03","model_type":"image","page_url":"https://fal.run/fal-ai/kling-image/v3/text-to-image","tagline":"Kling V3: Latest Kling Image model","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/kling/v1-5/kolors-virtual-try-on","name":"Kling Kolors Virtual TryOn v1.5","created_by":"fal","source":"official","description":"Kling Kolors Virtual TryOn v1.5 is a high quality image based Try-On endpoint which can be used for commercial try on.","status":"active","release_date":"2025-01-23","model_type":"image","page_url":"https://fal.run/fal-ai/kling/v1-5/kolors-virtual-try-on","tagline":"Kling Kolors Virtual TryOn v1.5 is a high quality image based Try-On endpoint which can be used for commercial try on.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/kling-video/ai-avatar/v2/pro","name":"Kling AI Avatar v2 Pro","created_by":"fal","source":"official","description":"Kling AI Avatar v2 Pro: The premium endpoint for creating avatar videos with realistic humans, animals, cartoons, or stylized characters","status":"active","release_date":"2025-12-04","model_type":"video","page_url":"https://fal.run/fal-ai/kling-video/ai-avatar/v2/pro","tagline":"Kling AI Avatar v2 Pro: The 
premium endpoint for creating avatar videos with realistic humans, animals, cartoons, or stylized characters","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/kling-video/ai-avatar/v2/standard","name":"Kling AI Avatar v2 Standard","created_by":"fal","source":"official","description":"Kling AI Avatar v2 Standard: Endpoint for creating avatar videos with realistic humans, animals, cartoons, or stylized characters","status":"active","release_date":"2025-12-04","model_type":"video","page_url":"https://fal.run/fal-ai/kling-video/ai-avatar/v2/standard","tagline":"Kling AI Avatar v2 Standard: Endpoint for creating avatar videos with realistic humans, animals, cartoons, or stylized characters","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/kling-video/create-voice","name":"Kling Video Create Voice","created_by":"fal","source":"official","description":"Create Voices to be used with Kling Models Voice Control","status":"active","release_date":"2025-12-16","model_type":"other","page_url":"https://fal.run/fal-ai/kling-video/create-voice","tagline":"Create Voices to be used with Kling Models Voice Control","last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/kling-video/lipsync/audio-to-video","name":"Kling LipSync Audio-to-Video","created_by":"fal","source":"official","description":"Kling LipSync is an audio-to-video model that generates realistic lip movements from audio input.","status":"active","release_date":"2025-03-27","model_type":"video","page_url":"https://fal.run/fal-ai/kling-video/lipsync/audio-to-video","tagline":"Kling LipSync is an audio-to-video model that generates realistic lip movements from audio 
input.","modalities":{"input":["text","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/kling-video/lipsync/text-to-video","name":"Kling LipSync Text-to-Video","created_by":"fal","source":"official","description":"Kling LipSync is a text-to-video model that generates realistic lip movements from text input.","status":"active","release_date":"2025-03-27","model_type":"video","page_url":"https://fal.run/fal-ai/kling-video/lipsync/text-to-video","tagline":"Kling LipSync is a text-to-video model that generates realistic lip movements from text input.","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/kling-video/o1/image-to-video","name":"Kling O1 First Frame Last Frame to Video [Pro]","created_by":"fal","source":"official","description":"Generate a video by taking a start frame and an end frame, animating the transition between them while following text-driven style and scene guidance.","status":"active","release_date":"2025-12-01","model_type":"video","page_url":"https://fal.run/fal-ai/kling-video/o1/image-to-video","tagline":"Generate a video by taking a start frame and an end frame, animating the transition between them while following text-driven style and scene guidance.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/kling-video/o1/reference-to-video","name":"Kling O1 Reference Image to Video [Pro]","created_by":"fal","source":"official","description":"Transform images, elements, and text into consistent, high-quality video scenes, ensuring stable character identity, object details, and environments.","status":"active","release_date":"2025-12-01","model_type":"video","page_url":"https://fal.run/fal-ai/kling-video/o1/reference-to-video","tagline":"Transform images, 
elements, and text into consistent, high-quality video scenes, ensuring stable character identity, object details, and environments.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/kling-video/o1/standard/image-to-video","name":"Kling O1 First Frame Last Frame to Video [Standard]","created_by":"fal","source":"official","description":"Generate a video by taking a start frame and an end frame, animating the transition between them while following text-driven style and scene guidance.","status":"active","release_date":"2025-12-15","model_type":"video","page_url":"https://fal.run/fal-ai/kling-video/o1/standard/image-to-video","tagline":"Generate a video by taking a start frame and an end frame, animating the transition between them while following text-driven style and scene guidance.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/kling-video/o1/standard/reference-to-video","name":"Kling O1 Reference Image to Video [Standard]","created_by":"fal","source":"official","description":"Transform images, elements, and text into consistent, high-quality video scenes, ensuring stable character identity, object details, and environments.","status":"active","release_date":"2025-12-15","model_type":"video","page_url":"https://fal.run/fal-ai/kling-video/o1/standard/reference-to-video","tagline":"Transform images, elements, and text into consistent, high-quality video scenes, ensuring stable character identity, object details, and environments.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/kling-video/o1/standard/video-to-video/edit","name":"Kling O1 Edit Video 
[Standard]","created_by":"fal","source":"official","description":"Edit an existing video using natural-language instructions, transforming subjects, settings, and style while retaining the original motion structure.","status":"active","release_date":"2025-12-15","model_type":"other","page_url":"https://fal.run/fal-ai/kling-video/o1/standard/video-to-video/edit","tagline":"Edit an existing video using natural-language instructions, transforming subjects, settings, and style while retaining the original motion structure.","last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/kling-video/o1/standard/video-to-video/reference","name":"Kling O1 Reference Video to Video [Standard]","created_by":"fal","source":"official","description":"Kling O1 Omni generates new shots guided by an input reference video, preserving cinematic language such as motion, and camera style to produce seamless scene continuity.","status":"active","release_date":"2025-12-15","model_type":"other","page_url":"https://fal.run/fal-ai/kling-video/o1/standard/video-to-video/reference","tagline":"Kling O1 Omni generates new shots guided by an input reference video, preserving cinematic language such as motion, and camera style to produce seamless scene continuity.","last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/kling-video/o1/video-to-video/edit","name":"Kling O1 Edit Video [Pro]","created_by":"fal","source":"official","description":"Edit an existing video using natural-language instructions, transforming subjects, settings, and style while retaining the original motion structure.","status":"active","release_date":"2025-12-01","model_type":"other","page_url":"https://fal.run/fal-ai/kling-video/o1/video-to-video/edit","tagline":"Edit an existing video using natural-language instructions, transforming subjects, settings, and style while retaining the original motion 
structure.","last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/kling-video/o1/video-to-video/reference","name":"Kling O1 Reference Video to Video [Pro]","created_by":"fal","source":"official","description":"Kling O1 Omni generates new shots guided by an input reference video, preserving cinematic language such as motion, and camera style to produce seamless scene continuity.","status":"active","release_date":"2025-12-01","model_type":"other","page_url":"https://fal.run/fal-ai/kling-video/o1/video-to-video/reference","tagline":"Kling O1 Omni generates new shots guided by an input reference video, preserving cinematic language such as motion, and camera style to produce seamless scene continuity.","last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/kling-video/o3/4k/image-to-video","name":"Kling Video","created_by":"fal","source":"official","description":"Kling's Native 4K is a video generation model that directly outputs professional-grade 4K video in one step, eliminating the need for post-production upscaling","status":"active","release_date":"2026-04-22","model_type":"video","page_url":"https://fal.run/fal-ai/kling-video/o3/4k/image-to-video","tagline":"Kling's Native 4K is a video generation model that directly outputs professional-grade 4K video in one step, eliminating the need for post-production upscaling","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/kling-video/o3/4k/reference-to-video","name":"Kling Video","created_by":"fal","source":"official","description":"Kling's Native 4K is a video generation model that directly outputs professional-grade 4K video in one step, eliminating the need for post-production upscaling","status":"active","release_date":"2026-04-22","model_type":"video","page_url":"https://fal.run/fal-ai/kling-video/o3/4k/reference-to-video","tagline":"Kling's Native 4K 
is a video generation model that directly outputs professional-grade 4K video in one step, eliminating the need for post-production upscaling","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/kling-video/o3/4k/text-to-video","name":"Kling Video","created_by":"fal","source":"official","description":"Kling's Native 4K is a video generation model that directly outputs professional-grade 4K video in one step, eliminating the need for post-production upscaling","status":"active","release_date":"2026-04-22","model_type":"video","page_url":"https://fal.run/fal-ai/kling-video/o3/4k/text-to-video","tagline":"Kling's Native 4K is a video generation model that directly outputs professional-grade 4K video in one step, eliminating the need for post-production upscaling","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/kling-video/o3/pro/image-to-video","name":"Kling O3 Image to Video [Pro]","created_by":"fal","source":"official","description":"Generate a video by taking a start frame and an end frame, animating the transition between them while following text-driven style and scene guidance.","status":"active","release_date":"2026-02-04","model_type":"video","page_url":"https://fal.run/fal-ai/kling-video/o3/pro/image-to-video","tagline":"Generate a video by taking a start frame and an end frame, animating the transition between them while following text-driven style and scene guidance.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/kling-video/o3/pro/reference-to-video","name":"Kling O3 Reference to Video [Pro]","created_by":"fal","source":"official","description":"Transform images, elements, and text into consistent, 
high-quality video scenes, ensuring stable character identity, object details, and environments.","status":"active","release_date":"2026-02-04","model_type":"video","page_url":"https://fal.run/fal-ai/kling-video/o3/pro/reference-to-video","tagline":"Transform images, elements, and text into consistent, high-quality video scenes, ensuring stable character identity, object details, and environments.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/kling-video/o3/pro/text-to-video","name":"Kling O3 Text to Video [Pro]","created_by":"fal","source":"official","description":"Generate realistic videos using Kling O3 from Kling Team!","status":"active","release_date":"2026-02-04","model_type":"video","page_url":"https://fal.run/fal-ai/kling-video/o3/pro/text-to-video","tagline":"Generate realistic videos using Kling O3 from Kling Team!","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/kling-video/o3/pro/video-to-video/edit","name":"Kling O3 Edit Video [Pro]","created_by":"fal","source":"official","description":"Edit videos using Kling O3 from Kling Team!","status":"active","release_date":"2026-02-04","model_type":"other","page_url":"https://fal.run/fal-ai/kling-video/o3/pro/video-to-video/edit","tagline":"Edit videos using Kling O3 from Kling Team!","last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/kling-video/o3/pro/video-to-video/reference","name":"Kling O3 Reference Video to Video [Pro]","created_by":"fal","source":"official","description":"Kling O3 Omni generates new shots guided by an input reference video, preserving cinematic language such as motion, and camera style to produce seamless scene 
continuity.","status":"active","release_date":"2026-02-04","model_type":"other","page_url":"https://fal.run/fal-ai/kling-video/o3/pro/video-to-video/reference","tagline":"Kling O3 Omni generates new shots guided by an input reference video, preserving cinematic language such as motion, and camera style to produce seamless scene continuity.","last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/kling-video/o3/standard/image-to-video","name":"Kling O3 Image to Video [Pro]","created_by":"fal","source":"official","description":"Generate a video by taking a start frame and an end frame, animating the transition between them while following text-driven style and scene guidance.","status":"active","release_date":"2026-02-04","model_type":"video","page_url":"https://fal.run/fal-ai/kling-video/o3/standard/image-to-video","tagline":"Generate a video by taking a start frame and an end frame, animating the transition between them while following text-driven style and scene guidance.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/kling-video/o3/standard/reference-to-video","name":"Kling O3 Reference to Video [Standard]","created_by":"fal","source":"official","description":"Transform images, elements, and text into consistent, high-quality video scenes, ensuring stable character identity, object details, and environments.","status":"active","release_date":"2026-02-04","model_type":"video","page_url":"https://fal.run/fal-ai/kling-video/o3/standard/reference-to-video","tagline":"Transform images, elements, and text into consistent, high-quality video scenes, ensuring stable character identity, object details, and 
environments.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/kling-video/o3/standard/text-to-video","name":"Kling O3 Text to Video [Standard]","created_by":"fal","source":"official","description":"Generate realistic videos using Kling O3 from Kling Team!","status":"active","release_date":"2026-02-04","model_type":"video","page_url":"https://fal.run/fal-ai/kling-video/o3/standard/text-to-video","tagline":"Generate realistic videos using Kling O3 from Kling Team!","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/kling-video/o3/standard/video-to-video/edit","name":"Kling O3 Edit Video [Standard]","created_by":"fal","source":"official","description":"Edit videos using Kling O3 from Kling Team!","status":"active","release_date":"2026-02-04","model_type":"other","page_url":"https://fal.run/fal-ai/kling-video/o3/standard/video-to-video/edit","tagline":"Edit videos using Kling O3 from Kling Team!","last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/kling-video/o3/standard/video-to-video/reference","name":"Kling O3 Reference Video to Video [Standard]","created_by":"fal","source":"official","description":"Kling O3 Omni generates new shots guided by an input reference video, preserving cinematic language such as motion, and camera style to produce seamless scene continuity.","status":"active","release_date":"2026-02-04","model_type":"other","page_url":"https://fal.run/fal-ai/kling-video/o3/standard/video-to-video/reference","tagline":"Kling O3 Omni generates new shots guided by an input reference video, preserving cinematic language such as motion, and camera style to produce seamless scene continuity.","last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/kling-video/v1/pro/ai-avatar","name":"Kling AI Avatar 
Pro","created_by":"fal","source":"official","description":"Kling AI Avatar Pro: The premium endpoint for creating avatar videos with realistic humans, animals, cartoons, or stylized characters","status":"active","release_date":"2025-09-13","model_type":"video","page_url":"https://fal.run/fal-ai/kling-video/v1/pro/ai-avatar","tagline":"Kling AI Avatar Pro: The premium endpoint for creating avatar videos with realistic humans, animals, cartoons, or stylized characters","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/kling-video/v1/standard/ai-avatar","name":"Kling AI Avatar","created_by":"fal","source":"official","description":"Kling AI Avatar Standard: Endpoint for creating avatar videos with realistic humans, animals, cartoons, or stylized characters","status":"active","release_date":"2025-09-13","model_type":"video","page_url":"https://fal.run/fal-ai/kling-video/v1/standard/ai-avatar","tagline":"Kling AI Avatar Standard: Endpoint for creating avatar videos with realistic humans, animals, cartoons, or stylized characters","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/kling-video/v1/standard/effects","name":"Kling 1.0","created_by":"fal","source":"official","description":"Generate video clips from your prompts using Kling 1.0","status":"active","release_date":"2025-03-06","model_type":"video","page_url":"https://fal.run/fal-ai/kling-video/v1/standard/effects","tagline":"Generate video clips from your prompts using Kling 1.0","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/kling-video/v1/standard/image-to-video","name":"Kling 1.0","created_by":"fal","source":"official","description":"Generate video clips 
from your images using Kling 1.0","status":"active","release_date":"2024-10-04","model_type":"video","page_url":"https://fal.run/fal-ai/kling-video/v1/standard/image-to-video","tagline":"Generate video clips from your images using Kling 1.0","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/kling-video/v1/standard/text-to-video","name":"Kling 1.0","created_by":"fal","source":"official","description":"Generate video clips from your prompts using Kling 1.0","status":"active","release_date":"2024-12-03","model_type":"video","page_url":"https://fal.run/fal-ai/kling-video/v1/standard/text-to-video","tagline":"Generate video clips from your prompts using Kling 1.0","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/kling-video/v1/tts","name":"Kling TTS","created_by":"fal","source":"official","description":"Generate speech from text prompts and different voices using the Kling TTS model, which leverages advanced AI techniques to create high-quality text-to-speech.","status":"active","release_date":"2025-09-13","model_type":"tts","page_url":"https://fal.run/fal-ai/kling-video/v1/tts","tagline":"Generate speech from text prompts and different voices using the Kling TTS model, which leverages advanced AI techniques to create high-quality text-to-speech.","modalities":{"input":["text"],"output":["audio"]},"endpoints":["audio_speech"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/kling-video/v1.5/pro/effects","name":"Kling 1.5","created_by":"fal","source":"official","description":"Generate video clips from your prompts using Kling 1.5 (pro)","status":"active","release_date":"2025-03-06","model_type":"video","page_url":"https://fal.run/fal-ai/kling-video/v1.5/pro/effects","tagline":"Generate video clips from your prompts using 
Kling 1.5 (pro)","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/kling-video/v1.5/pro/image-to-video","name":"Kling 1.5","created_by":"fal","source":"official","description":"Generate video clips from your images using Kling 1.5 (pro)","status":"active","release_date":"2024-10-04","model_type":"video","page_url":"https://fal.run/fal-ai/kling-video/v1.5/pro/image-to-video","tagline":"Generate video clips from your images using Kling 1.5 (pro)","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/kling-video/v1.5/pro/text-to-video","name":"Kling 1.5","created_by":"fal","source":"official","description":"Generate video clips from your prompts using Kling 1.5 (pro)","status":"active","release_date":"2024-11-25","model_type":"video","page_url":"https://fal.run/fal-ai/kling-video/v1.5/pro/text-to-video","tagline":"Generate video clips from your prompts using Kling 1.5 (pro)","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/kling-video/v1.6/pro/effects","name":"Kling 1.6","created_by":"fal","source":"official","description":"Generate video clips from your prompts using Kling 1.6 (pro)","status":"active","release_date":"2025-03-06","model_type":"video","page_url":"https://fal.run/fal-ai/kling-video/v1.6/pro/effects","tagline":"Generate video clips from your prompts using Kling 1.6 (pro)","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/kling-video/v1.6/pro/elements","name":"Kling 1.6 Elements","created_by":"fal","source":"official","description":"Generate video clips from your multiple image references using Kling 1.6 
(pro)","status":"active","release_date":"2025-05-20","model_type":"video","page_url":"https://fal.run/fal-ai/kling-video/v1.6/pro/elements","tagline":"Generate video clips from your multiple image references using Kling 1.6 (pro)","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/kling-video/v1.6/pro/image-to-video","name":"Kling 1.6","created_by":"fal","source":"official","description":"Generate video clips from your images using Kling 1.6 (pro)","status":"active","release_date":"2025-01-07","model_type":"video","page_url":"https://fal.run/fal-ai/kling-video/v1.6/pro/image-to-video","tagline":"Generate video clips from your images using Kling 1.6 (pro)","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/kling-video/v1.6/pro/text-to-video","name":"Kling 1.6","created_by":"fal","source":"official","description":"Generate video clips from your prompts using Kling 1.6 (pro)","status":"active","release_date":"2025-02-27","model_type":"video","page_url":"https://fal.run/fal-ai/kling-video/v1.6/pro/text-to-video","tagline":"Generate video clips from your prompts using Kling 1.6 (pro)","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/kling-video/v1.6/standard/effects","name":"Kling 1.6","created_by":"fal","source":"official","description":"Generate video clips from your prompts using Kling 1.6 (std)","status":"active","release_date":"2025-03-06","model_type":"video","page_url":"https://fal.run/fal-ai/kling-video/v1.6/standard/effects","tagline":"Generate video clips from your prompts using Kling 1.6 
(std)","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/kling-video/v1.6/standard/elements","name":"Kling 1.6 Elements","created_by":"fal","source":"official","description":"Generate video clips from your multiple image references using Kling 1.6 (standard)","status":"active","release_date":"2025-05-20","model_type":"video","page_url":"https://fal.run/fal-ai/kling-video/v1.6/standard/elements","tagline":"Generate video clips from your multiple image references using Kling 1.6 (standard)","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/kling-video/v1.6/standard/image-to-video","name":"Kling 1.6","created_by":"fal","source":"official","description":"Generate video clips from your images using Kling 1.6 (std)","status":"active","release_date":"2025-01-07","model_type":"video","page_url":"https://fal.run/fal-ai/kling-video/v1.6/standard/image-to-video","tagline":"Generate video clips from your images using Kling 1.6 (std)","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/kling-video/v1.6/standard/text-to-video","name":"Kling 1.6","created_by":"fal","source":"official","description":"Generate video clips from your prompts using Kling 1.6 (std)","status":"active","release_date":"2025-01-07","model_type":"video","page_url":"https://fal.run/fal-ai/kling-video/v1.6/standard/text-to-video","tagline":"Generate video clips from your prompts using Kling 1.6 (std)","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-26","last_updated":"2026-06-29"},{"id":"fal-ai/kling-video/v2/master/image-to-video","name":"Kling 2.0 
Master","created_by":"fal","source":"official","description":"Generate video clips from your images using Kling 2.0 Master","status":"active","release_date":"2025-04-14","model_type":"video","page_url":"https://fal.run/fal-ai/kling-video/v2/master/image-to-video","tagline":"Generate video clips from your images using Kling 2.0 Master","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/kling-video/v2/master/text-to-video","name":"Kling 2.0 Master","created_by":"fal","source":"official","description":"Generate video clips from your prompts using Kling 2.0 Master","status":"active","release_date":"2025-04-14","model_type":"video","page_url":"https://fal.run/fal-ai/kling-video/v2/master/text-to-video","tagline":"Generate video clips from your prompts using Kling 2.0 Master","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/kling-video/v2.1/master/image-to-video","name":"Kling 2.1 Master","created_by":"fal","source":"official","description":"Kling 2.1 Master: The premium endpoint for Kling 2.1, designed for top-tier image-to-video generation with unparalleled motion fluidity, cinematic visuals, and exceptional prompt precision.","status":"active","release_date":"2025-05-29","model_type":"video","page_url":"https://fal.run/fal-ai/kling-video/v2.1/master/image-to-video","tagline":"Kling 2.1 Master: The premium endpoint for Kling 2.1, designed for top-tier image-to-video generation with unparalleled motion fluidity, cinematic visuals, and exceptional prompt precision.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/kling-video/v2.1/master/text-to-video","name":"Kling 2.1 
Master","created_by":"fal","source":"official","description":"Kling 2.1 Master: The premium endpoint for Kling 2.1, designed for top-tier text-to-video generation with unparalleled motion fluidity, cinematic visuals, and exceptional prompt precision.","status":"active","release_date":"2025-05-29","model_type":"video","page_url":"https://fal.run/fal-ai/kling-video/v2.1/master/text-to-video","tagline":"Kling 2.1 Master: The premium endpoint for Kling 2.1, designed for top-tier text-to-video generation with unparalleled motion fluidity, cinematic visuals, and exceptional prompt precision.","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/kling-video/v2.1/pro/image-to-video","name":"Kling 2.1 (pro)","created_by":"fal","source":"official","description":"Kling 2.1 Pro is an advanced endpoint for the Kling 2.1 model, offering professional-grade videos with enhanced visual fidelity, precise camera movements, and dynamic motion control, perfect for cinematic storytelling.","status":"active","release_date":"2025-05-28","model_type":"video","page_url":"https://fal.run/fal-ai/kling-video/v2.1/pro/image-to-video","tagline":"Kling 2.1 Pro is an advanced endpoint for the Kling 2.1 model, offering professional-grade videos with enhanced visual fidelity, precise camera movements, and dynamic motion control, perfect for cinem","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/kling-video/v2.1/standard/image-to-video","name":"Kling 2.1 (standard)","created_by":"fal","source":"official","description":"Kling 2.1 Standard is a cost-efficient endpoint for the Kling 2.1 model, delivering high-quality image-to-video generation 
\n\n","status":"active","release_date":"2025-05-28","model_type":"video","page_url":"https://fal.run/fal-ai/kling-video/v2.1/standard/image-to-video","tagline":"Kling 2.1 Standard is a cost-efficient endpoint for the Kling 2.1 model, delivering high-quality image-to-video generation \n\n","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/kling-video/v2.5-turbo/pro/image-to-video","name":"Kling Video","created_by":"fal","source":"official","description":"Kling 2.5 Turbo Pro: Top-tier image-to-video generation with unparalleled motion fluidity, cinematic visuals, and exceptional prompt precision.","status":"active","release_date":"2025-09-22","model_type":"video","page_url":"https://fal.run/fal-ai/kling-video/v2.5-turbo/pro/image-to-video","tagline":"Kling 2.5 Turbo Pro: Top-tier image-to-video generation with unparalleled motion fluidity, cinematic visuals, and exceptional prompt precision.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/kling-video/v2.5-turbo/pro/text-to-video","name":"Kling v2.5 Text to Video","created_by":"fal","source":"official","description":"Kling 2.5 Turbo Pro: Top-tier text-to-video generation with unparalleled motion fluidity, cinematic visuals, and exceptional prompt precision.","status":"active","release_date":"2025-09-22","model_type":"video","page_url":"https://fal.run/fal-ai/kling-video/v2.5-turbo/pro/text-to-video","tagline":"Kling 2.5 Turbo Pro: Top-tier text-to-video generation with unparalleled motion fluidity, cinematic visuals, and exceptional prompt precision.","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/kling-video/v2.5-turbo/standard/image-to-video","name":"Kling 
Video","created_by":"fal","source":"official","description":"Kling 2.5 Turbo Standard: Top-tier image-to-video generation with unparalleled motion fluidity, cinematic visuals, and exceptional prompt precision.","status":"active","release_date":"2025-10-22","model_type":"video","page_url":"https://fal.run/fal-ai/kling-video/v2.5-turbo/standard/image-to-video","tagline":"Kling 2.5 Turbo Standard: Top-tier image-to-video generation with unparalleled motion fluidity, cinematic visuals, and exceptional prompt precision.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/kling-video/v2.6/pro/image-to-video","name":"Kling Video v2.6 Image to Video","created_by":"fal","source":"official","description":"Kling 2.6 Pro: Top-tier image-to-video with cinematic visuals, fluid motion, and native audio generation.","status":"active","release_date":"2025-12-02","model_type":"video","page_url":"https://fal.run/fal-ai/kling-video/v2.6/pro/image-to-video","tagline":"Kling 2.6 Pro: Top-tier image-to-video with cinematic visuals, fluid motion, and native audio generation.","capabilities":{"vision":true},"modalities":{"input":["text","image","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/kling-video/v2.6/pro/motion-control","name":"Kling Video v2.6 Motion Control [Pro]","created_by":"fal","source":"official","description":"Transfer movements from a reference video to any character image.","status":"active","release_date":"2025-12-21","model_type":"other","page_url":"https://fal.run/fal-ai/kling-video/v2.6/pro/motion-control","tagline":"Transfer movements from a reference video to any character image.","capabilities":{"vision":true},"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/kling-video/v2.6/pro/text-to-video","name":"Kling Video v2.6 Text to 
Video","created_by":"fal","source":"official","description":"Kling 2.6 Pro: Top-tier text-to-video with cinematic visuals, fluid motion, and native audio generation.","status":"active","release_date":"2025-12-02","model_type":"video","page_url":"https://fal.run/fal-ai/kling-video/v2.6/pro/text-to-video","tagline":"Kling 2.6 Pro: Top-tier text-to-video with cinematic visuals, fluid motion, and native audio generation.","modalities":{"input":["text","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/kling-video/v2.6/standard/motion-control","name":"Kling Video v2.6 Motion Control [Standard]","created_by":"fal","source":"official","description":"Transfer movements from a reference video to any character image.","status":"active","release_date":"2025-12-21","model_type":"other","page_url":"https://fal.run/fal-ai/kling-video/v2.6/standard/motion-control","tagline":"Transfer movements from a reference video to any character image.","capabilities":{"vision":true},"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/kling-video/v3/4k/image-to-video","name":"Kling Video","created_by":"fal","source":"official","description":"Kling's Native 4K is a video generation model that directly outputs professional-grade 4K video in one step, eliminating the need for post-production upscaling","status":"active","release_date":"2026-04-22","model_type":"video","page_url":"https://fal.run/fal-ai/kling-video/v3/4k/image-to-video","tagline":"Kling's Native 4K is a video generation model that directly outputs professional-grade 4K video in one step, eliminating the need for post-production upscaling","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/kling-video/v3/4k/text-to-video","name":"Kling Video V3 Text to Video 
4K","created_by":"fal","source":"official","description":"Kling's Native 4K is a video generation model that directly outputs professional-grade 4K video in one step, eliminating the need for post-production upscaling","status":"active","release_date":"2026-04-22","model_type":"video","page_url":"https://fal.run/fal-ai/kling-video/v3/4k/text-to-video","tagline":"Kling's Native 4K is a video generation model that directly outputs professional-grade 4K video in one step, eliminating the need for post-production upscaling","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/kling-video/v3/pro/image-to-video","name":"Kling Video v3 Image to Video [Pro]","created_by":"fal","source":"official","description":"Kling 3.0 Pro: Top-tier image-to-video with cinematic visuals, fluid motion, and native audio generation, with custom element support.","status":"active","release_date":"2026-02-04","model_type":"video","page_url":"https://fal.run/fal-ai/kling-video/v3/pro/image-to-video","tagline":"Kling 3.0 Pro: Top-tier image-to-video with cinematic visuals, fluid motion, and native audio generation, with custom element support.","capabilities":{"vision":true},"modalities":{"input":["text","image","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-05-29","last_updated":"2026-06-03"},{"id":"fal-ai/kling-video/v3/pro/motion-control","name":"Kling Video","created_by":"fal","source":"official","description":"Transfer movements from a reference video to any character image.","status":"active","release_date":"2026-03-05","model_type":"other","page_url":"https://fal.run/fal-ai/kling-video/v3/pro/motion-control","tagline":"Transfer movements from a reference video to any character image.","capabilities":{"vision":true},"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/kling-video/v3/pro/text-to-video","name":"Kling Video v3 Text to Video 
[Pro]","created_by":"fal","source":"official","description":"Kling 3.0 Pro: Top-tier text-to-video with cinematic visuals, fluid motion, and native audio generation, with multi-shot support.","status":"active","release_date":"2026-02-04","model_type":"video","page_url":"https://fal.run/fal-ai/kling-video/v3/pro/text-to-video","tagline":"Kling 3.0 Pro: Top-tier text-to-video with cinematic visuals, fluid motion, and native audio generation, with multi-shot support.","modalities":{"input":["text","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/kling-video/v3/standard/image-to-video","name":"Kling Video v3 Image to Video [Standard]","created_by":"fal","source":"official","description":"Kling 3.0 Standard: Top-tier image-to-video with cinematic visuals, fluid motion, and native audio generation, with custom element support.","status":"active","release_date":"2026-02-04","model_type":"video","page_url":"https://fal.run/fal-ai/kling-video/v3/standard/image-to-video","tagline":"Kling 3.0 Standard: Top-tier image-to-video with cinematic visuals, fluid motion, and native audio generation, with custom element support.","capabilities":{"vision":true},"modalities":{"input":["text","image","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/kling-video/v3/standard/motion-control","name":"Kling Video","created_by":"fal","source":"official","description":"Transfer movements from a reference video to any character image.","status":"active","release_date":"2026-03-05","model_type":"other","page_url":"https://fal.run/fal-ai/kling-video/v3/standard/motion-control","tagline":"Transfer movements from a reference video to any character image.","capabilities":{"vision":true},"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/kling-video/v3/standard/text-to-video","name":"Kling Video v3 Text to Video 
[Standard]","created_by":"fal","source":"official","description":"Kling 3.0 Standard: Top-tier text-to-video with cinematic visuals, fluid motion, and native audio generation, with multi-shot support.","status":"active","release_date":"2026-02-04","model_type":"video","page_url":"https://fal.run/fal-ai/kling-video/v3/standard/text-to-video","tagline":"Kling 3.0 Standard: Top-tier text-to-video with cinematic visuals, fluid motion, and native audio generation, with multi-shot support.","modalities":{"input":["text","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/kling-video/v3/turbo/pro/image-to-video","name":"Kling Video V3 Turbo Pro Image to Video","created_by":"fal","source":"official","description":"Generate high quality 1080p videos from images using Kling's Turbo 3.0 model, with improved lipsync and multishot generation capabilities.","status":"active","release_date":"2026-06-16","model_type":"video","page_url":"https://fal.run/fal-ai/kling-video/v3/turbo/pro/image-to-video","tagline":"Generate high quality 1080p videos from images using Kling's Turbo 3.0 model, with improved lipsync and multishot generation capabilities.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/kling-video/v3/turbo/pro/text-to-video","name":"Kling Video V3 Turbo Pro Text to Video","created_by":"fal","source":"official","description":"Generate high quality 1080p videos using Kling's Turbo 3.0 model, with improved lipsync and multishot generation capabilities.","status":"active","release_date":"2026-06-16","model_type":"video","page_url":"https://fal.run/fal-ai/kling-video/v3/turbo/pro/text-to-video","tagline":"Generate high quality 1080p videos using Kling's Turbo 3.0 model, with improved lipsync and multishot generation 
capabilities.","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/kling-video/v3/turbo/standard/image-to-video","name":"Kling Video V3 Standard Turbo Image to Video","created_by":"fal","source":"official","description":"Kling 3.0 Turbo Standard animates a first and last frame reference image into 720P video with native audio, delivering quick, affordable image-driven motion for fast turnaround","status":"active","release_date":"2026-06-16","model_type":"video","page_url":"https://fal.run/fal-ai/kling-video/v3/turbo/standard/image-to-video","tagline":"Kling 3.0 Turbo Standard animates a first and last frame reference image into 720P video with native audio, delivering quick, affordable image-driven motion for fast turnaround","capabilities":{"vision":true},"modalities":{"input":["text","image","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/kling-video/v3/turbo/standard/text-to-video","name":"Kling Video V3 Standard Turbo Text to Video","created_by":"fal","source":"official","description":"Kling 3.0 Turbo Standard is a fast, cost-efficient video generation model that turns text prompts directly into 720P video with native audio, optimized for rapid iteration and high-volume production","status":"active","release_date":"2026-06-16","model_type":"video","page_url":"https://fal.run/fal-ai/kling-video/v3/turbo/standard/text-to-video","tagline":"Kling 3.0 Turbo Standard is a fast, cost-efficient video generation model that turns text prompts directly into 720P video with native audio, optimized for rapid iteration and high-volume production","modalities":{"input":["text","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/kling-video/video-to-audio","name":"Kling Video","created_by":"fal","source":"official","description":"Generate audio 
from input videos using Kling","status":"active","release_date":"2025-10-09","model_type":"other","page_url":"https://fal.run/fal-ai/kling-video/video-to-audio","tagline":"Generate audio from input videos using Kling","last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/kokoro/american-english","name":"Kokoro TTS","created_by":"fal","source":"official","description":"Kokoro is a lightweight text-to-speech model that delivers comparable quality to larger models while being significantly faster and more cost-efficient.","status":"active","release_date":"2025-02-14","model_type":"other","page_url":"https://fal.run/fal-ai/kokoro/american-english","tagline":"Kokoro is a lightweight text-to-speech model that delivers comparable quality to larger models while being significantly faster and more cost-efficient.","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/kokoro/brazilian-portuguese","name":"Kokoro TTS (Brazilian Portuguese)","created_by":"fal","source":"official","description":"A natural and expressive Brazilian Portuguese text-to-speech model optimized for clarity and fluency.","status":"active","release_date":"2025-02-14","model_type":"other","page_url":"https://fal.run/fal-ai/kokoro/brazilian-portuguese","tagline":"A natural and expressive Brazilian Portuguese text-to-speech model optimized for clarity and fluency.","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/kokoro/british-english","name":"Kokoro TTS (British English)","created_by":"fal","source":"official","description":"A high-quality British English text-to-speech model offering natural and expressive voice synthesis.","status":"active","release_date":"2025-02-14","model_type":"other","page_url":"https://fal.run/fal-ai/kokoro/british-english","tagline":"A high-quality British English text-to-speech model offering natural and expressive voice 
synthesis.","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/kokoro/french","name":"Kokoro TTS (French)","created_by":"fal","source":"official","description":"An expressive and natural French text-to-speech model for both European and Canadian French.","status":"active","release_date":"2025-02-14","model_type":"other","page_url":"https://fal.run/fal-ai/kokoro/french","tagline":"An expressive and natural French text-to-speech model for both European and Canadian French.","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/kokoro/hindi","name":"Kokoro TTS (Hindi)","created_by":"fal","source":"official","description":"A fast and expressive Hindi text-to-speech model with clear pronunciation and accurate intonation.","status":"active","release_date":"2025-02-14","model_type":"other","page_url":"https://fal.run/fal-ai/kokoro/hindi","tagline":"A fast and expressive Hindi text-to-speech model with clear pronunciation and accurate intonation.","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/kokoro/italian","name":"Kokoro TTS (Italian)","created_by":"fal","source":"official","description":"A high-quality Italian text-to-speech model delivering smooth and expressive speech synthesis.","status":"active","release_date":"2025-02-14","model_type":"other","page_url":"https://fal.run/fal-ai/kokoro/italian","tagline":"A high-quality Italian text-to-speech model delivering smooth and expressive speech synthesis.","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/kokoro/japanese","name":"Kokoro TTS (Japanese)","created_by":"fal","source":"official","description":"A fast and natural-sounding Japanese text-to-speech model optimized for smooth pronunciation.","status":"active","release_date":"2025-02-14","model_type":"other","page_url":"https://fal.run/fal-ai/kokoro/japanese","tagline":"A fast and natural-sounding Japanese text-to-speech model optimized for smooth 
pronunciation.","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/kokoro/mandarin-chinese","name":"Kokoro TTS (Mandarin Chinese)","created_by":"fal","source":"official","description":"A highly efficient Mandarin Chinese text-to-speech model that captures natural tones and prosody.","status":"active","release_date":"2025-02-14","model_type":"other","page_url":"https://fal.run/fal-ai/kokoro/mandarin-chinese","tagline":"A highly efficient Mandarin Chinese text-to-speech model that captures natural tones and prosody.","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/kokoro/spanish","name":"Kokoro TTS (Spanish)","created_by":"fal","source":"official","description":"A natural-sounding Spanish text-to-speech model optimized for Latin American and European Spanish.","status":"active","release_date":"2025-02-14","model_type":"other","page_url":"https://fal.run/fal-ai/kokoro/spanish","tagline":"A natural-sounding Spanish text-to-speech model optimized for Latin American and European Spanish.","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/kolors/image-to-image","name":"Kolors Image to Image","created_by":"fal","source":"official","description":"Photorealistic Image-to-Image","status":"active","release_date":"2024-11-19","model_type":"image","page_url":"https://fal.run/fal-ai/kolors/image-to-image","tagline":"Photorealistic Image-to-Image","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/kolors","name":"Kolors","created_by":"fal","source":"official","description":"Photorealistic Text-to-Image","status":"active","release_date":"2024-07-24","model_type":"image","page_url":"https://fal.run/fal-ai/kolors","tagline":"Photorealistic 
Text-to-Image","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/krea-2-trainer","name":"Krea 2 Trainer","created_by":"fal","source":"official","description":"Train a custom LoRA on your own images to teach Krea 2 a new subject, character, or style.","status":"active","release_date":"2026-06-19","model_type":"other","page_url":"https://fal.run/fal-ai/krea-2-trainer","tagline":"Train a custom LoRA on your own images to teach Krea 2 a new subject, character, or style.","capabilities":{"vision":true},"last_seen_at":"2026-06-25","last_updated":"2026-06-29"},{"id":"fal-ai/krea-2/turbo/lora","name":"Krea 2 Text to Image Turbo LoRA","created_by":"fal","source":"official","description":"Generate high-fidelity images from text with Krea 2 using a custom-trained LoRA.","status":"active","release_date":"2026-06-19","model_type":"image","page_url":"https://fal.run/fal-ai/krea-2/turbo/lora","tagline":"Generate high-fidelity images from text with Krea 2 using a custom-trained LoRA.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/krea-2/turbo","name":"Krea 2 Turbo","created_by":"fal","source":"official","description":"Generate high-fidelity images from text in seconds with Krea 2 Turbo, the speed-optimized open-source version of Krea 2, preserving its aesthetic range for rapid ideation.","status":"active","release_date":"2026-06-18","model_type":"image","page_url":"https://fal.run/fal-ai/krea-2/turbo","tagline":"Generate high-fidelity images from text in seconds with Krea 2 Turbo, the speed-optimized open-source version of Krea 2, preserving its aesthetic range for rapid 
ideation.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/krea-wan-14b/text-to-video","name":"Krea Wan 14b- Text to Video","created_by":"fal","source":"official","description":"Fast Text-to-Video endpoint for Krea's Wan 14b model.","status":"active","release_date":"2025-10-20","model_type":"video","page_url":"https://fal.run/fal-ai/krea-wan-14b/text-to-video","tagline":"Fast Text-to-Video endpoint for Krea's Wan 14b model.","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/krea-wan-14b/video-to-video","name":"Krea Wan 14B","created_by":"fal","source":"official","description":"Superfast video model based on Wan 2.1 14b by Krea, excelling at real-time video-editing.","status":"active","release_date":"2025-10-14","model_type":"other","page_url":"https://fal.run/fal-ai/krea-wan-14b/video-to-video","tagline":"Superfast video model based on Wan 2.1 14b by Krea, excelling at real-time video-editing.","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/latentsync","name":"LatentSync","created_by":"fal","source":"official","description":"LatentSync is a video-to-video model that generates lip sync animations from audio using advanced algorithms for high-quality synchronization.","status":"active","release_date":"2025-03-25","model_type":"other","page_url":"https://fal.run/fal-ai/latentsync","tagline":"LatentSync is a video-to-video model that generates lip sync animations from audio using advanced algorithms for high-quality synchronization.","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/lava-sr","name":"Lava SR","created_by":"fal","source":"official","description":"Enhance muffled 16 kHz speech audio into crystal-clear 48 kHz, with denoising for particularly bad 
inputs.","status":"active","release_date":"2026-02-23","model_type":"other","page_url":"https://fal.run/fal-ai/lava-sr","tagline":"Enhance muffled 16 kHz speech audio into crystal-clear 48 kHz, with denoising for particularly bad inputs.","last_seen_at":"2026-02-23","last_updated":"2026-05-11"},{"id":"fal-ai/layer-diffusion","name":"Layer Diffusion XL","created_by":"fal","source":"official","description":"SDXL with an alpha channel.","status":"active","release_date":"2024-04-13","model_type":"image","page_url":"https://fal.run/fal-ai/layer-diffusion","tagline":"SDXL with an alpha channel.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/lcm-sd15-i2i","name":"Optimized Latent Consistency (SDv1.5)","created_by":"fal","source":"official","description":"Produce high-quality images with minimal inference steps.","status":"active","release_date":"2023-11-09","model_type":"image","page_url":"https://fal.run/fal-ai/lcm-sd15-i2i","tagline":"Produce high-quality images with minimal inference steps.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/lcm","name":"Latent Consistency (SDXL & SDv1.5)","created_by":"fal","source":"official","description":"Produce high-quality images with minimal inference steps.","status":"active","release_date":"2024-02-04","model_type":"image","page_url":"https://fal.run/fal-ai/lcm","tagline":"Produce high-quality images with minimal inference steps.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/leffa/pose-transfer","name":"Leffa Pose Transfer","created_by":"fal","source":"official","description":"Leffa Pose Transfer is an endpoint for changing pose of an 
image with a reference image.","status":"active","release_date":"2024-12-17","model_type":"image","page_url":"https://fal.run/fal-ai/leffa/pose-transfer","tagline":"Leffa Pose Transfer is an endpoint for changing pose of an image with a reference image.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/leffa/virtual-tryon","name":"Leffa Virtual TryOn","created_by":"fal","source":"official","description":"Leffa Virtual TryOn is a high quality image based Try-On endpoint which can be used for commercial try on.","status":"active","release_date":"2024-12-17","model_type":"image","page_url":"https://fal.run/fal-ai/leffa/virtual-tryon","tagline":"Leffa Virtual TryOn is a high quality image based Try-On endpoint which can be used for commercial try on.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/lightning-models","name":"Lightning Models","created_by":"fal","source":"official","description":"Collection of SDXL Lightning models.","status":"active","release_date":"2024-04-25","model_type":"image","page_url":"https://fal.run/fal-ai/lightning-models","tagline":"Collection of SDXL Lightning models.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/lightx/recamera","name":"Lightx","created_by":"fal","source":"official","description":"Use the capabilities of lightx to relight and recamera your videos.","status":"active","release_date":"2025-12-22","model_type":"other","page_url":"https://fal.run/fal-ai/lightx/recamera","tagline":"Use the capabilities of lightx to relight and recamera your 
videos.","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/lightx/relight","name":"Lightx","created_by":"fal","source":"official","description":"Use tlightx capabilities to relight and recamera your videos.","status":"active","release_date":"2025-12-22","model_type":"other","page_url":"https://fal.run/fal-ai/lightx/relight","tagline":"Use tlightx capabilities to relight and recamera your videos.","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/live-portrait/image","name":"Live Portrait","created_by":"fal","source":"official","description":"Transfer expression from a video to a portrait.","status":"active","release_date":"2024-10-01","model_type":"image","page_url":"https://fal.run/fal-ai/live-portrait/image","tagline":"Transfer expression from a video to a portrait.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/live-portrait","name":"Live Portrait","created_by":"fal","source":"official","description":"Transfer expression from a video to a portrait.","status":"active","release_date":"2024-07-09","model_type":"video","page_url":"https://fal.run/fal-ai/live-portrait","tagline":"Transfer expression from a video to a portrait.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/llava-next","name":"LLaVA v1.6 34B","created_by":"fal","source":"official","description":"Vision","status":"active","release_date":"2024-02-14","model_type":"other","page_url":"https://fal.run/fal-ai/llava-next","tagline":"Vision","capabilities":{"vision":true},"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/longcat-image/edit","name":"Longcat Image","created_by":"fal","source":"official","description":"LongCat image Edit is a 6B parameter image editing model 
excelling at multilingual text rendering, photorealism and deployment efficiency.","status":"active","release_date":"2025-12-05","model_type":"image","page_url":"https://fal.run/fal-ai/longcat-image/edit","tagline":"LongCat image Edit is a 6B parameter image editing model excelling at multilingual text rendering, photorealism and deployment efficiency.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/longcat-image","name":"Longcat Image","created_by":"fal","source":"official","description":"LongCat image is a 6B parameter model excelling at multilingual text rendering, photorealism and deployment efficiency.","status":"active","release_date":"2025-12-05","model_type":"image","page_url":"https://fal.run/fal-ai/longcat-image","tagline":"LongCat image is a 6B parameter model excelling at multilingual text rendering, photorealism and deployment efficiency.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/longcat-multi-avatar/image-audio-to-video/multi-speaker","name":"Longcat Multi Avatar","created_by":"fal","source":"official","description":"LongCat-Video-Avatar is an audio-driven video generation model that can generates super-realistic, lip-synchronized long video generation with natural dynamics and consistent identity.","status":"active","release_date":"2025-12-30","model_type":"other","page_url":"https://fal.run/fal-ai/longcat-multi-avatar/image-audio-to-video/multi-speaker","tagline":"LongCat-Video-Avatar is an audio-driven video generation model that can generates super-realistic, lip-synchronized long video generation with natural dynamics and consistent 
identity.","capabilities":{"vision":true},"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/longcat-multi-avatar/image-audio-to-video","name":"Longcat Multi Avatar","created_by":"fal","source":"official","description":"LongCat-Video-Avatar is an audio-driven video generation model that can generates super-realistic, lip-synchronized long video generation with natural dynamics and consistent identity.","status":"active","release_date":"2026-01-08","model_type":"other","page_url":"https://fal.run/fal-ai/longcat-multi-avatar/image-audio-to-video","tagline":"LongCat-Video-Avatar is an audio-driven video generation model that can generates super-realistic, lip-synchronized long video generation with natural dynamics and consistent identity.","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/longcat-single-avatar/audio-to-video","name":"Longcat Single Avatar","created_by":"fal","source":"official","description":"LongCat-Video-Avatar is an audio-driven video generation model that can generates super-realistic, lip-synchronized long video generation with natural dynamics and consistent identity.","status":"active","release_date":"2025-12-30","model_type":"other","page_url":"https://fal.run/fal-ai/longcat-single-avatar/audio-to-video","tagline":"LongCat-Video-Avatar is an audio-driven video generation model that can generates super-realistic, lip-synchronized long video generation with natural dynamics and consistent identity.","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/longcat-single-avatar/image-audio-to-video","name":"Longcat Single Avatar","created_by":"fal","source":"official","description":"LongCat-Video-Avatar is an audio-driven video generation model that can generates super-realistic, lip-synchronized long video generation with natural dynamics and consistent 
identity.","status":"active","release_date":"2025-12-30","model_type":"other","page_url":"https://fal.run/fal-ai/longcat-single-avatar/image-audio-to-video","tagline":"LongCat-Video-Avatar is an audio-driven video generation model that can generates super-realistic, lip-synchronized long video generation with natural dynamics and consistent identity.","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/longcat-video/distilled/image-to-video/480p","name":"LongCat Video Distilled","created_by":"fal","source":"official","description":"Generate long videos from images using LongCat Video Distilled","status":"active","release_date":"2025-10-29","model_type":"video","page_url":"https://fal.run/fal-ai/longcat-video/distilled/image-to-video/480p","tagline":"Generate long videos from images using LongCat Video Distilled","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/longcat-video/distilled/image-to-video/720p","name":"LongCat Video Distilled","created_by":"fal","source":"official","description":"Generate long videos in 720p/30fps from images using LongCat Video Distilled","status":"active","release_date":"2025-10-30","model_type":"video","page_url":"https://fal.run/fal-ai/longcat-video/distilled/image-to-video/720p","tagline":"Generate long videos in 720p/30fps from images using LongCat Video Distilled","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/longcat-video/distilled/text-to-video/480p","name":"LongCat Video Distilled","created_by":"fal","source":"official","description":"Generate long videos from text using LongCat Video 
Distilled","status":"active","release_date":"2025-10-28","model_type":"video","page_url":"https://fal.run/fal-ai/longcat-video/distilled/text-to-video/480p","tagline":"Generate long videos from text using LongCat Video Distilled","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/longcat-video/distilled/text-to-video/720p","name":"LongCat Video Distilled","created_by":"fal","source":"official","description":"Generate long videos in 720p/30fps from text using LongCat Video Distilled","status":"active","release_date":"2025-10-30","model_type":"video","page_url":"https://fal.run/fal-ai/longcat-video/distilled/text-to-video/720p","tagline":"Generate long videos in 720p/30fps from text using LongCat Video Distilled","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/longcat-video/image-to-video/480p","name":"LongCat Video","created_by":"fal","source":"official","description":"Generate long videos from images using LongCat Video","status":"active","release_date":"2025-10-30","model_type":"video","page_url":"https://fal.run/fal-ai/longcat-video/image-to-video/480p","tagline":"Generate long videos from images using LongCat Video","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/longcat-video/image-to-video/720p","name":"LongCat Video","created_by":"fal","source":"official","description":"Generate long videos in 720p/30fps from images using LongCat Video","status":"active","release_date":"2025-10-30","model_type":"video","page_url":"https://fal.run/fal-ai/longcat-video/image-to-video/720p","tagline":"Generate long videos in 720p/30fps from images using LongCat 
Video","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/longcat-video/text-to-video/480p","name":"LongCat Video","created_by":"fal","source":"official","description":"Generate long videos from text using LongCat Video","status":"active","release_date":"2025-10-30","model_type":"video","page_url":"https://fal.run/fal-ai/longcat-video/text-to-video/480p","tagline":"Generate long videos from text using LongCat Video","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/longcat-video/text-to-video/720p","name":"LongCat Video","created_by":"fal","source":"official","description":"Generate long videos in 720p/30fps from text using LongCat Video","status":"active","release_date":"2025-10-30","model_type":"video","page_url":"https://fal.run/fal-ai/longcat-video/text-to-video/720p","tagline":"Generate long videos in 720p/30fps from text using LongCat Video","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/lora/image-to-image","name":"Stable Diffusion with LoRAs","created_by":"fal","source":"official","description":"Run Any Stable Diffusion model with customizable LoRA weights.","status":"active","release_date":"2024-04-17","model_type":"image","page_url":"https://fal.run/fal-ai/lora/image-to-image","tagline":"Run Any Stable Diffusion model with customizable LoRA weights.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/lora/inpaint","name":"Stable Diffusion with LoRAs","created_by":"fal","source":"official","description":"Run Any Stable Diffusion model with customizable LoRA 
weights.","status":"active","release_date":"2024-04-18","model_type":"image","page_url":"https://fal.run/fal-ai/lora/inpaint","tagline":"Run Any Stable Diffusion model with customizable LoRA weights.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/lora","name":"Stable Diffusion with LoRAs","created_by":"fal","source":"official","description":"Run Any Stable Diffusion model with customizable LoRA weights.","status":"active","release_date":"2023-09-26","model_type":"image","page_url":"https://fal.run/fal-ai/lora","tagline":"Run Any Stable Diffusion model with customizable LoRA weights.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/ltx-2-19b/audio-to-video/lora","name":"LTX-2 19B","created_by":"fal","source":"official","description":"Generate video with audio from audio, text and images using LTX-2 and custom LoRA","status":"active","release_date":"2026-01-27","model_type":"other","page_url":"https://fal.run/fal-ai/ltx-2-19b/audio-to-video/lora","tagline":"Generate video with audio from audio, text and images using LTX-2 and custom LoRA","capabilities":{"vision":true},"last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2-19b/audio-to-video","name":"LTX-2 19B","created_by":"fal","source":"official","description":"Generate video with audio from audio, text and images using LTX-2","status":"active","release_date":"2026-01-27","model_type":"other","page_url":"https://fal.run/fal-ai/ltx-2-19b/audio-to-video","tagline":"Generate video with audio from audio, text and images using LTX-2","capabilities":{"vision":true},"last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2-19b/distilled/audio-to-video/lora","name":"LTX-2 19B 
Distilled","created_by":"fal","source":"official","description":"Generate video with audio from audio, text and images using LTX-2 Distilled and custom LoRA","status":"active","release_date":"2026-01-27","model_type":"other","page_url":"https://fal.run/fal-ai/ltx-2-19b/distilled/audio-to-video/lora","tagline":"Generate video with audio from audio, text and images using LTX-2 Distilled and custom LoRA","capabilities":{"vision":true},"last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2-19b/distilled/audio-to-video","name":"LTX-2 19B Distilled","created_by":"fal","source":"official","description":"Generate video with audio from audio, text and images using LTX-2 Distilled","status":"active","release_date":"2026-01-27","model_type":"other","page_url":"https://fal.run/fal-ai/ltx-2-19b/distilled/audio-to-video","tagline":"Generate video with audio from audio, text and images using LTX-2 Distilled","capabilities":{"vision":true},"last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2-19b/distilled/extend-video/lora","name":"LTX-2 19B Distilled","created_by":"fal","source":"official","description":"Extend videos with audio using LTX-2 Distilled and custom LoRA","status":"active","release_date":"2026-01-05","model_type":"other","page_url":"https://fal.run/fal-ai/ltx-2-19b/distilled/extend-video/lora","tagline":"Extend videos with audio using LTX-2 Distilled and custom LoRA","last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2-19b/distilled/extend-video","name":"LTX-2 19B Distilled","created_by":"fal","source":"official","description":"Extend videos with audio using LTX-2 Distilled","status":"active","release_date":"2026-01-05","model_type":"other","page_url":"https://fal.run/fal-ai/ltx-2-19b/distilled/extend-video","tagline":"Extend videos with audio using LTX-2 Distilled","last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2-19b/distilled/image-to-video/lora","name":"LTX-2 19B 
Distilled","created_by":"fal","source":"official","description":"Generate video with audio from images using LTX-2 Distilled and custom LoRA","status":"active","release_date":"2026-01-05","model_type":"video","page_url":"https://fal.run/fal-ai/ltx-2-19b/distilled/image-to-video/lora","tagline":"Generate video with audio from images using LTX-2 Distilled and custom LoRA","capabilities":{"vision":true},"modalities":{"input":["text","image","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2-19b/distilled/image-to-video","name":"LTX-2 19B Distilled","created_by":"fal","source":"official","description":"Generate video with audio from images using LTX-2 Distilled","status":"active","release_date":"2026-01-05","model_type":"video","page_url":"https://fal.run/fal-ai/ltx-2-19b/distilled/image-to-video","tagline":"Generate video with audio from images using LTX-2 Distilled","capabilities":{"vision":true},"modalities":{"input":["text","image","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2-19b/distilled/text-to-video/lora","name":"LTX-2 19B Distilled","created_by":"fal","source":"official","description":"Generate video with audio from text using LTX-2 Distilled and custom LoRA","status":"active","release_date":"2026-01-05","model_type":"video","page_url":"https://fal.run/fal-ai/ltx-2-19b/distilled/text-to-video/lora","tagline":"Generate video with audio from text using LTX-2 Distilled and custom LoRA","modalities":{"input":["text","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2-19b/distilled/text-to-video","name":"LTX-2 19B Distilled","created_by":"fal","source":"official","description":"Generate video with audio from text using LTX-2 
Distilled","status":"active","release_date":"2026-01-05","model_type":"video","page_url":"https://fal.run/fal-ai/ltx-2-19b/distilled/text-to-video","tagline":"Generate video with audio from text using LTX-2 Distilled","modalities":{"input":["text","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2-19b/distilled/video-to-video/lora","name":"LTX-2 19B Distilled","created_by":"fal","source":"official","description":"Generate video with audio from videos using LTX-2 Distilled and custom LoRA","status":"active","release_date":"2026-01-07","model_type":"other","page_url":"https://fal.run/fal-ai/ltx-2-19b/distilled/video-to-video/lora","tagline":"Generate video with audio from videos using LTX-2 Distilled and custom LoRA","last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2-19b/distilled/video-to-video","name":"LTX-2 19B Distilled","created_by":"fal","source":"official","description":"Generate video with audio from videos using LTX-2 Distilled","status":"active","release_date":"2026-01-07","model_type":"other","page_url":"https://fal.run/fal-ai/ltx-2-19b/distilled/video-to-video","tagline":"Generate video with audio from videos using LTX-2 Distilled","last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2-19b/extend-video/lora","name":"LTX-2 19B","created_by":"fal","source":"official","description":"Extend video with audio using LTX-2 and custom LoRA","status":"active","release_date":"2026-01-05","model_type":"other","page_url":"https://fal.run/fal-ai/ltx-2-19b/extend-video/lora","tagline":"Extend video with audio using LTX-2 and custom LoRA","last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2-19b/extend-video","name":"LTX-2 19B","created_by":"fal","source":"official","description":"Extend video with audio using 
LTX-2","status":"active","release_date":"2026-01-05","model_type":"other","page_url":"https://fal.run/fal-ai/ltx-2-19b/extend-video","tagline":"Extend video with audio using LTX-2","last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2-19b/image-to-video/lora","name":"LTX-2 19B","created_by":"fal","source":"official","description":"Generate video with audio from images using LTX-2 and custom LoRA","status":"active","release_date":"2026-01-05","model_type":"video","page_url":"https://fal.run/fal-ai/ltx-2-19b/image-to-video/lora","tagline":"Generate video with audio from images using LTX-2 and custom LoRA","capabilities":{"vision":true},"modalities":{"input":["text","image","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2-19b/image-to-video","name":"LTX-2 19B","created_by":"fal","source":"official","description":"Generate video with audio from images using LTX-2","status":"active","release_date":"2026-01-05","model_type":"video","page_url":"https://fal.run/fal-ai/ltx-2-19b/image-to-video","tagline":"Generate video with audio from images using LTX-2","capabilities":{"vision":true},"modalities":{"input":["text","image","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2-19b/text-to-video/lora","name":"LTX-2 19B","created_by":"fal","source":"official","description":"Generate video with audio from text using LTX-2 and custom LoRA","status":"active","release_date":"2026-01-05","model_type":"video","page_url":"https://fal.run/fal-ai/ltx-2-19b/text-to-video/lora","tagline":"Generate video with audio from text using LTX-2 and custom LoRA","modalities":{"input":["text","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2-19b/text-to-video","name":"LTX-2 19B","created_by":"fal","source":"official","description":"Generate video 
with audio from text using LTX-2","status":"active","release_date":"2026-01-05","model_type":"video","page_url":"https://fal.run/fal-ai/ltx-2-19b/text-to-video","tagline":"Generate video with audio from text using LTX-2","modalities":{"input":["text","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2-19b/video-to-video/lora","name":"LTX-2 19B","created_by":"fal","source":"official","description":"Generate video with audio from videos using LTX-2 and custom LoRA","status":"active","release_date":"2026-01-07","model_type":"other","page_url":"https://fal.run/fal-ai/ltx-2-19b/video-to-video/lora","tagline":"Generate video with audio from videos using LTX-2 and custom LoRA","last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2-19b/video-to-video","name":"LTX-2 19B","created_by":"fal","source":"official","description":"Generate video with audio from videos using LTX-2","status":"active","release_date":"2026-01-07","model_type":"other","page_url":"https://fal.run/fal-ai/ltx-2-19b/video-to-video","tagline":"Generate video with audio from videos using LTX-2","last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2/audio-to-video","name":"LTX 2.0 Video Pro","created_by":"fal","source":"official","description":"Generate video from audio using LTX-2","status":"active","release_date":"2026-03-04","model_type":"other","page_url":"https://fal.run/fal-ai/ltx-2/audio-to-video","tagline":"Generate video from audio using LTX-2","last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2/extend-video","name":"LTX Video 2.0 Pro","created_by":"fal","source":"official","description":"Extends videos with audio using LTX-2","status":"active","release_date":"2026-03-04","model_type":"other","page_url":"https://fal.run/fal-ai/ltx-2/extend-video","tagline":"Extends videos with audio using 
LTX-2","last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2/image-to-video/fast","name":"LTX Video 2.0 Fast","created_by":"fal","source":"official","description":"Create high-fidelity video with audio from images with LTX-2 Fast","status":"active","release_date":"2025-11-26","model_type":"video","page_url":"https://fal.run/fal-ai/ltx-2/image-to-video/fast","tagline":"Create high-fidelity video with audio from images with LTX-2 Fast","capabilities":{"vision":true},"modalities":{"input":["text","image","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2/image-to-video","name":"LTX Video 2.0 Pro","created_by":"fal","source":"official","description":"Create high-fidelity video with audio from images with LTX-2 Pro","status":"active","release_date":"2025-11-26","model_type":"video","page_url":"https://fal.run/fal-ai/ltx-2/image-to-video","tagline":"Create high-fidelity video with audio from images with LTX-2 Pro","capabilities":{"vision":true},"modalities":{"input":["text","image","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2/retake-video","name":"LTX Video 2.0 Retake","created_by":"fal","source":"official","description":"Change sections of a video using LTX-2","status":"active","release_date":"2025-11-26","model_type":"other","page_url":"https://fal.run/fal-ai/ltx-2/retake-video","tagline":"Change sections of a video using LTX-2","last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2/text-to-video/fast","name":"LTX Video 2.0 Fast","created_by":"fal","source":"official","description":"Create high-fidelity video with audio from text with LTX-2 Fast","status":"active","release_date":"2025-11-26","model_type":"video","page_url":"https://fal.run/fal-ai/ltx-2/text-to-video/fast","tagline":"Create high-fidelity video with audio from text with LTX-2 
Fast","modalities":{"input":["text","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2/text-to-video","name":"LTX Video 2.0 Pro","created_by":"fal","source":"official","description":"Create high-fidelity video with audio from text with LTX-2 Pro.","status":"active","release_date":"2025-11-26","model_type":"video","page_url":"https://fal.run/fal-ai/ltx-2/text-to-video","tagline":"Create high-fidelity video with audio from text with LTX-2 Pro.","modalities":{"input":["text","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2.3-22b/audio-to-video/lora","name":"LTX-2.3 22B","created_by":"fal","source":"official","description":"Generate video with audio from audio, text and images using LTX-2.3 and custom LoRA","status":"active","release_date":"2026-03-14","model_type":"other","page_url":"https://fal.run/fal-ai/ltx-2.3-22b/audio-to-video/lora","tagline":"Generate video with audio from audio, text and images using LTX-2.3 and custom LoRA","capabilities":{"vision":true},"last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2.3-22b/audio-to-video","name":"LTX-2.3 22B","created_by":"fal","source":"official","description":"Generate video with audio from audio, text and images using LTX-2","status":"active","release_date":"2026-03-14","model_type":"other","page_url":"https://fal.run/fal-ai/ltx-2.3-22b/audio-to-video","tagline":"Generate video with audio from audio, text and images using LTX-2","capabilities":{"vision":true},"last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2.3-22b/distilled/audio-to-video/lora","name":"LTX-2.3 22B Distilled","created_by":"fal","source":"official","description":"Generate video with audio from audio, text and images using LTX-2.3 Distilled and custom 
LoRA","status":"active","release_date":"2026-03-14","model_type":"other","page_url":"https://fal.run/fal-ai/ltx-2.3-22b/distilled/audio-to-video/lora","tagline":"Generate video with audio from audio, text and images using LTX-2.3 Distilled and custom LoRA","capabilities":{"vision":true},"last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2.3-22b/distilled/audio-to-video","name":"LTX-2.3 22B Distilled","created_by":"fal","source":"official","description":"Generate video with audio from audio, text and images using LTX-2 Distilled","status":"active","release_date":"2026-03-14","model_type":"other","page_url":"https://fal.run/fal-ai/ltx-2.3-22b/distilled/audio-to-video","tagline":"Generate video with audio from audio, text and images using LTX-2 Distilled","capabilities":{"vision":true},"last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2.3-22b/distilled/image-to-video/lora","name":"LTX-2.3 22B Distilled","created_by":"fal","source":"official","description":"Generate video with audio from images using LTX-2.3 Distilled and custom LoRA","status":"active","release_date":"2026-03-14","model_type":"video","page_url":"https://fal.run/fal-ai/ltx-2.3-22b/distilled/image-to-video/lora","tagline":"Generate video with audio from images using LTX-2.3 Distilled and custom LoRA","capabilities":{"vision":true},"modalities":{"input":["text","image","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2.3-22b/distilled/image-to-video","name":"LTX-2.3 22B Distilled","created_by":"fal","source":"official","description":"Generate video with audio from images using LTX-2.3 Distilled","status":"active","release_date":"2026-03-14","model_type":"video","page_url":"https://fal.run/fal-ai/ltx-2.3-22b/distilled/image-to-video","tagline":"Generate video with audio from images using LTX-2.3 
Distilled","capabilities":{"vision":true},"modalities":{"input":["text","image","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2.3-22b/distilled/reference-video-to-video/lora","name":"LTX-2.3 22B Distilled","created_by":"fal","source":"official","description":"Generate video with audio from reference videos using LTX-2.3 Distilled and custom LoRA","status":"active","release_date":"2026-04-14","model_type":"other","page_url":"https://fal.run/fal-ai/ltx-2.3-22b/distilled/reference-video-to-video/lora","tagline":"Generate video with audio from reference videos using LTX-2.3 Distilled and custom LoRA","last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2.3-22b/distilled/reference-video-to-video","name":"LTX-2.3 22B Distilled","created_by":"fal","source":"official","description":"Generate video with audio from reference videos using LTX-2.3 Distilled","status":"active","release_date":"2026-04-14","model_type":"other","page_url":"https://fal.run/fal-ai/ltx-2.3-22b/distilled/reference-video-to-video","tagline":"Generate video with audio from reference videos using LTX-2.3 Distilled","last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2.3-22b/distilled/text-to-video/lora","name":"LTX-2.3 22B Distilled","created_by":"fal","source":"official","description":"Generate video with audio from text using LTX-2.3 Distilled and custom LoRA","status":"active","release_date":"2026-03-14","model_type":"video","page_url":"https://fal.run/fal-ai/ltx-2.3-22b/distilled/text-to-video/lora","tagline":"Generate video with audio from text using LTX-2.3 Distilled and custom LoRA","modalities":{"input":["text","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2.3-22b/distilled/text-to-video","name":"LTX-2.3 22B Distilled","created_by":"fal","source":"official","description":"Generate video with 
audio from text using LTX-2.3 Distilled","status":"active","release_date":"2026-03-14","model_type":"video","page_url":"https://fal.run/fal-ai/ltx-2.3-22b/distilled/text-to-video","tagline":"Generate video with audio from text using LTX-2.3 Distilled","modalities":{"input":["text","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2.3-22b/distilled/video-to-video/lora","name":"LTX-2.3 22B Distilled","created_by":"fal","source":"official","description":"Generate video with audio from videos using LTX-2.3 Distilled and custom LoRA","status":"active","release_date":"2026-03-14","model_type":"other","page_url":"https://fal.run/fal-ai/ltx-2.3-22b/distilled/video-to-video/lora","tagline":"Generate video with audio from videos using LTX-2.3 Distilled and custom LoRA","last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2.3-22b/distilled/video-to-video","name":"LTX-2.3 22B Distilled","created_by":"fal","source":"official","description":"Generate video with audio from videos using LTX-2.3 Distilled","status":"active","release_date":"2026-03-14","model_type":"other","page_url":"https://fal.run/fal-ai/ltx-2.3-22b/distilled/video-to-video","tagline":"Generate video with audio from videos using LTX-2.3 Distilled","last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2.3-22b/extend-video/lora","name":"LTX-2.3 22B","created_by":"fal","source":"official","description":"Extend video with audio using LTX-2.3 and custom LoRA","status":"active","release_date":"2026-03-14","model_type":"other","page_url":"https://fal.run/fal-ai/ltx-2.3-22b/extend-video/lora","tagline":"Extend video with audio using LTX-2.3 and custom LoRA","last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2.3-22b/extend-video","name":"LTX-2.3 22B","created_by":"fal","source":"official","description":"Extend video with audio using 
LTX-2.3","status":"active","release_date":"2026-03-14","model_type":"other","page_url":"https://fal.run/fal-ai/ltx-2.3-22b/extend-video","tagline":"Extend video with audio using LTX-2.3","last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2.3-22b/image-to-video/lora","name":"LTX-2.3 22B","created_by":"fal","source":"official","description":"Generate video with audio from images using LTX-2.3 and custom LoRA","status":"active","release_date":"2026-03-14","model_type":"video","page_url":"https://fal.run/fal-ai/ltx-2.3-22b/image-to-video/lora","tagline":"Generate video with audio from images using LTX-2.3 and custom LoRA","capabilities":{"vision":true},"modalities":{"input":["text","image","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2.3-22b/image-to-video","name":"LTX-2.3 22B","created_by":"fal","source":"official","description":"Generate video with audio from images using LTX-2.3","status":"active","release_date":"2026-03-14","model_type":"video","page_url":"https://fal.run/fal-ai/ltx-2.3-22b/image-to-video","tagline":"Generate video with audio from images using LTX-2.3","capabilities":{"vision":true},"modalities":{"input":["text","image","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2.3-22b/reference-video-to-video/lora","name":"LTX 2.3 22B","created_by":"fal","source":"official","description":"Generate video with audio from reference video, text and images using LTX-2.3 and custom LoRA","status":"active","release_date":"2026-04-14","model_type":"other","page_url":"https://fal.run/fal-ai/ltx-2.3-22b/reference-video-to-video/lora","tagline":"Generate video with audio from reference video, text and images using LTX-2.3 and custom 
LoRA","capabilities":{"vision":true},"last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2.3-22b/reference-video-to-video","name":"LTX-2.3 22B","created_by":"fal","source":"official","description":"Generate video with audio from reference video, text and images using LTX-2.3","status":"active","release_date":"2026-04-14","model_type":"other","page_url":"https://fal.run/fal-ai/ltx-2.3-22b/reference-video-to-video","tagline":"Generate video with audio from reference video, text and images using LTX-2.3","capabilities":{"vision":true},"last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2.3-22b/text-to-video/lora","name":"LTX-2.3 22B","created_by":"fal","source":"official","description":"Generate video with audio from text using LTX-2.3 and custom LoRA","status":"active","release_date":"2026-03-14","model_type":"video","page_url":"https://fal.run/fal-ai/ltx-2.3-22b/text-to-video/lora","tagline":"Generate video with audio from text using LTX-2.3 and custom LoRA","modalities":{"input":["text","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2.3-22b/text-to-video","name":"LTX-2.3 22B","created_by":"fal","source":"official","description":"Generate video with audio from text using LTX-2.3","status":"active","release_date":"2026-03-14","model_type":"video","page_url":"https://fal.run/fal-ai/ltx-2.3-22b/text-to-video","tagline":"Generate video with audio from text using LTX-2.3","modalities":{"input":["text","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2.3-22b/video-to-video/lora","name":"LTX-2.3 22B","created_by":"fal","source":"official","description":"Generate video with audio from videos using LTX-2.3 and custom LoRA","status":"active","release_date":"2026-03-14","model_type":"other","page_url":"https://fal.run/fal-ai/ltx-2.3-22b/video-to-video/lora","tagline":"Generate 
video with audio from videos using LTX-2.3 and custom LoRA","last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2.3-22b/video-to-video","name":"LTX-2.3 22B","created_by":"fal","source":"official","description":"Generate video with audio from videos using LTX-2.3","status":"active","release_date":"2026-03-14","model_type":"other","page_url":"https://fal.run/fal-ai/ltx-2.3-22b/video-to-video","tagline":"Generate video with audio from videos using LTX-2.3","last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2.3/audio-to-video","name":"LTX 2.3 Video Pro","created_by":"fal","source":"official","description":"LTX-2.3 is a high-quality, fast AI video model available in Pro and Fast variants for text-to-video, image-to-video, and audio-to-video.","status":"active","release_date":"2026-03-05","model_type":"other","page_url":"https://fal.run/fal-ai/ltx-2.3/audio-to-video","tagline":"LTX-2.3 is a high-quality, fast AI video model available in Pro and Fast variants for text-to-video, image-to-video, and audio-to-video.","capabilities":{"vision":true},"last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2.3/extend-video","name":"LTX Video 2.3 Pro","created_by":"fal","source":"official","description":"LTX-2.3 is a high-quality, fast AI video model available in Pro and Fast variants for text-to-video, image-to-video, and audio-to-video.","status":"active","release_date":"2026-03-05","model_type":"other","page_url":"https://fal.run/fal-ai/ltx-2.3/extend-video","tagline":"LTX-2.3 is a high-quality, fast AI video model available in Pro and Fast variants for text-to-video, image-to-video, and audio-to-video.","capabilities":{"vision":true},"last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2.3/image-to-video/fast","name":"LTX 2.3 Video Fast","created_by":"fal","source":"official","description":"LTX-2.3 is a high-quality, fast AI video model available in Pro and Fast variants for text-to-video, 
image-to-video, and audio-to-video.","status":"active","release_date":"2026-03-05","model_type":"video","page_url":"https://fal.run/fal-ai/ltx-2.3/image-to-video/fast","tagline":"LTX-2.3 is a high-quality, fast AI video model available in Pro and Fast variants for text-to-video, image-to-video, and audio-to-video.","capabilities":{"vision":true},"modalities":{"input":["text","image","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2.3/image-to-video","name":"LTX 2.3 Video Pro","created_by":"fal","source":"official","description":"LTX-2.3 is a high-quality, fast AI video model available in Pro and Fast variants for text-to-video, image-to-video, and audio-to-video.","status":"active","release_date":"2026-03-05","model_type":"video","page_url":"https://fal.run/fal-ai/ltx-2.3/image-to-video","tagline":"LTX-2.3 is a high-quality, fast AI video model available in Pro and Fast variants for text-to-video, image-to-video, and audio-to-video.","capabilities":{"vision":true},"modalities":{"input":["text","image","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2.3-quality/audio-to-video/lora","name":"Ltx 2.3 Quality","created_by":"fal","source":"official","description":"Generate high-quality video with audio from audio, text and images using LTX-2.3 and custom LoRA","status":"active","release_date":"2026-06-01","model_type":"other","page_url":"https://fal.run/fal-ai/ltx-2.3-quality/audio-to-video/lora","tagline":"Generate high-quality video with audio from audio, text and images using LTX-2.3 and custom LoRA","capabilities":{"vision":true},"last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2.3-quality/audio-to-video","name":"Ltx 2.3 Quality","created_by":"fal","source":"official","description":"Generate high-quality video with audio from audio, text and images using 
LTX-2","status":"active","release_date":"2026-06-01","model_type":"other","page_url":"https://fal.run/fal-ai/ltx-2.3-quality/audio-to-video","tagline":"Generate high-quality video with audio from audio, text and images using LTX-2","capabilities":{"vision":true},"last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2.3-quality/colorization","name":"Ltx 2.3 Quality","created_by":"fal","source":"official","description":"Colorize high-quality video using LTX-2.3","status":"active","release_date":"2026-06-24","model_type":"other","page_url":"https://fal.run/fal-ai/ltx-2.3-quality/colorization","tagline":"Colorize high-quality video using LTX-2.3","last_seen_at":"2026-06-25","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2.3-quality/cross-eyed","name":"Ltx 2.3 Quality","created_by":"fal","source":"official","description":"Cross-eyes for high-quality video using LTX-2.3","status":"active","release_date":"2026-06-25","model_type":"other","page_url":"https://fal.run/fal-ai/ltx-2.3-quality/cross-eyed","tagline":"Cross-eyes for high-quality video using LTX-2.3","last_seen_at":"2026-06-25","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2.3-quality/day-to-night","name":"Ltx 2.3 Quality","created_by":"fal","source":"official","description":"Day to Night for high-quality video using LTX-2.3","status":"active","release_date":"2026-06-25","model_type":"other","page_url":"https://fal.run/fal-ai/ltx-2.3-quality/day-to-night","tagline":"Day to Night for high-quality video using LTX-2.3","last_seen_at":"2026-06-25","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2.3-quality/deblur","name":"Ltx 2.3 Quality","created_by":"fal","source":"official","description":"Deblur high-quality video using LTX-2.3\n","status":"active","release_date":"2026-06-24","model_type":"other","page_url":"https://fal.run/fal-ai/ltx-2.3-quality/deblur","tagline":"Deblur high-quality video using 
LTX-2.3\n","last_seen_at":"2026-06-25","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2.3-quality/decompression","name":"Ltx 2.3 Quality","created_by":"fal","source":"official","description":"Decompression / Denoise high-quality video using LTX-2.3","status":"active","release_date":"2026-06-25","model_type":"other","page_url":"https://fal.run/fal-ai/ltx-2.3-quality/decompression","tagline":"Decompression / Denoise high-quality video using LTX-2.3","last_seen_at":"2026-06-25","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2.3-quality/hdr/lora","name":"Ltx 2.3 Quality","created_by":"fal","source":"official","description":"Generate HDR from reference video using LTX-2.3 with lora","status":"active","release_date":"2026-06-01","model_type":"other","page_url":"https://fal.run/fal-ai/ltx-2.3-quality/hdr/lora","tagline":"Generate HDR from reference video using LTX-2.3 with lora","last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2.3-quality/hdr","name":"Ltx 2.3 Quality","created_by":"fal","source":"official","description":"Generate HDR from reference video using LTX-2.3 ","status":"active","release_date":"2026-06-01","model_type":"other","page_url":"https://fal.run/fal-ai/ltx-2.3-quality/hdr","tagline":"Generate HDR from reference video using LTX-2.3 ","last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2.3-quality/image-to-video/lora","name":"Ltx 2.3 Quality","created_by":"fal","source":"official","description":"Generate high-quality video with audio from images using LTX-2.3 and custom LoRA","status":"active","release_date":"2026-06-01","model_type":"video","page_url":"https://fal.run/fal-ai/ltx-2.3-quality/image-to-video/lora","tagline":"Generate high-quality video with audio from images using LTX-2.3 and custom 
LoRA","capabilities":{"vision":true},"modalities":{"input":["text","image","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2.3-quality/image-to-video","name":"Ltx 2.3 Quality","created_by":"fal","source":"official","description":"Generate high-quality video with audio from images using LTX-2.3","status":"active","release_date":"2026-06-01","model_type":"video","page_url":"https://fal.run/fal-ai/ltx-2.3-quality/image-to-video","tagline":"Generate high-quality video with audio from images using LTX-2.3","capabilities":{"vision":true},"modalities":{"input":["text","image","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2.3-quality/ingredient","name":"Ltx 2.3 Quality","created_by":"fal","source":"official","description":"Generate high-quality video with audio from reference, character sheet, storyboard using LTX-2.3","status":"active","release_date":"2026-06-18","model_type":"video","page_url":"https://fal.run/fal-ai/ltx-2.3-quality/ingredient","tagline":"Generate high-quality video with audio from reference, character sheet, storyboard using LTX-2.3","capabilities":{"vision":true},"modalities":{"input":["text","image","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2.3-quality/inpaint/lora","name":"Ltx 2.3 Quality","created_by":"fal","source":"official","description":"Inpaint high-quality video using LTX-2.3 with lora","status":"active","release_date":"2026-06-18","model_type":"other","page_url":"https://fal.run/fal-ai/ltx-2.3-quality/inpaint/lora","tagline":"Inpaint high-quality video using LTX-2.3 with lora","last_seen_at":"2026-06-18","last_updated":"2026-06-18"},{"id":"fal-ai/ltx-2.3-quality/inpaint","name":"Ltx 2.3 Quality","created_by":"fal","source":"official","description":"Inpaint high-quality video using LTX-2.3 
","status":"active","release_date":"2026-06-18","model_type":"other","page_url":"https://fal.run/fal-ai/ltx-2.3-quality/inpaint","tagline":"Inpaint high-quality video using LTX-2.3 ","last_seen_at":"2026-06-18","last_updated":"2026-06-18"},{"id":"fal-ai/ltx-2.3-quality/instant-shave","name":"Ltx 2.3 Quality","created_by":"fal","source":"official","description":"Instant shave high-quality video using LTX-2.3","status":"active","release_date":"2026-06-25","model_type":"other","page_url":"https://fal.run/fal-ai/ltx-2.3-quality/instant-shave","tagline":"Instant shave high-quality video using LTX-2.3","last_seen_at":"2026-06-25","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2.3-quality/outpaint/lora","name":"Ltx 2.3 Quality","created_by":"fal","source":"official","description":"Outpaint high-quality video using LTX-2.3 with Lora","status":"active","release_date":"2026-06-17","model_type":"other","page_url":"https://fal.run/fal-ai/ltx-2.3-quality/outpaint/lora","tagline":"Outpaint high-quality video using LTX-2.3 with Lora","last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2.3-quality/outpaint","name":"Ltx 2.3 Quality","created_by":"fal","source":"official","description":"Outpaint high-quality video using LTX-2.3 ","status":"active","release_date":"2026-06-17","model_type":"other","page_url":"https://fal.run/fal-ai/ltx-2.3-quality/outpaint","tagline":"Outpaint high-quality video using LTX-2.3 ","last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2.3-quality/reference-video-to-video/lora","name":"Ltx 2.3 Quality","created_by":"fal","source":"official","description":"Generate high-quality video with audio from reference video, text and images using LTX-2.3 and custom LoRA","status":"active","release_date":"2026-06-01","model_type":"other","page_url":"https://fal.run/fal-ai/ltx-2.3-quality/reference-video-to-video/lora","tagline":"Generate high-quality video with audio from reference video, text and images using LTX-2.3 and 
custom LoRA","capabilities":{"vision":true},"last_seen_at":"2026-06-25","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2.3-quality/reference-video-to-video","name":"Ltx 2.3 Quality","created_by":"fal","source":"official","description":"Generate high-quality video with audio from reference video, text and images using LTX-2.3","status":"active","release_date":"2026-06-01","model_type":"other","page_url":"https://fal.run/fal-ai/ltx-2.3-quality/reference-video-to-video","tagline":"Generate high-quality video with audio from reference video, text and images using LTX-2.3","capabilities":{"vision":true},"last_seen_at":"2026-06-25","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2.3-quality/render-to-real","name":"Ltx 2.3 Quality","created_by":"fal","source":"official","description":"Transform your 3D video render into realistic using first frame with Ltx 2.3","status":"active","release_date":"2026-06-26","model_type":"other","page_url":"https://fal.run/fal-ai/ltx-2.3-quality/render-to-real","tagline":"Transform your 3D video render into realistic using first frame with Ltx 2.3","last_seen_at":"2026-06-26","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2.3-quality/text-to-audio/lora","name":"Ltx 2.3 Quality","created_by":"fal","source":"official","description":"Text to Audio high-quality using LTX-2.3 with Lora","status":"active","release_date":"2026-06-17","model_type":"other","page_url":"https://fal.run/fal-ai/ltx-2.3-quality/text-to-audio/lora","tagline":"Text to Audio high-quality using LTX-2.3 with Lora","last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2.3-quality/text-to-audio","name":"Ltx 2.3 Quality","created_by":"fal","source":"official","description":"Text to Audio high-quality using LTX-2.3 ","status":"active","release_date":"2026-06-17","model_type":"other","page_url":"https://fal.run/fal-ai/ltx-2.3-quality/text-to-audio","tagline":"Text to Audio high-quality using LTX-2.3 
","last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2.3-quality/text-to-video/lora","name":"Ltx 2.3 Quality","created_by":"fal","source":"official","description":"Generate high-quality video with audio from text using LTX-2.3 and custom LoRA","status":"active","release_date":"2026-06-01","model_type":"video","page_url":"https://fal.run/fal-ai/ltx-2.3-quality/text-to-video/lora","tagline":"Generate high-quality video with audio from text using LTX-2.3 and custom LoRA","modalities":{"input":["text","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2.3-quality/text-to-video","name":"Ltx 2.3 Quality","created_by":"fal","source":"official","description":"Generate high-quality video with audio from text using LTX-2.3","status":"active","release_date":"2026-06-01","model_type":"video","page_url":"https://fal.run/fal-ai/ltx-2.3-quality/text-to-video","tagline":"Generate high-quality video with audio from text using LTX-2.3","modalities":{"input":["text","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2.3-quality/water-simulation","name":"Ltx 2.3 Quality","created_by":"fal","source":"official","description":"Water Simulation transformation for high-quality video using LTX-2.3","status":"active","release_date":"2026-06-25","model_type":"other","page_url":"https://fal.run/fal-ai/ltx-2.3-quality/water-simulation","tagline":"Water Simulation transformation for high-quality video using LTX-2.3","last_seen_at":"2026-06-25","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2.3/retake-video","name":"LTX Video 2.3 Pro","created_by":"fal","source":"official","description":"LTX-2.3 is a high-quality, fast AI video model available in Pro and Fast variants for text-to-video, image-to-video, and 
audio-to-video.","status":"active","release_date":"2026-03-05","model_type":"other","page_url":"https://fal.run/fal-ai/ltx-2.3/retake-video","tagline":"LTX-2.3 is a high-quality, fast AI video model available in Pro and Fast variants for text-to-video, image-to-video, and audio-to-video.","capabilities":{"vision":true},"last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2.3/text-to-video/fast","name":"LTX 2.3 Video Fast","created_by":"fal","source":"official","description":"LTX-2.3 is a high-quality, fast AI video model available in Pro and Fast variants for text-to-video, image-to-video, and audio-to-video.","status":"active","release_date":"2026-03-05","model_type":"video","page_url":"https://fal.run/fal-ai/ltx-2.3/text-to-video/fast","tagline":"LTX-2.3 is a high-quality, fast AI video model available in Pro and Fast variants for text-to-video, image-to-video, and audio-to-video.","capabilities":{"vision":true},"modalities":{"input":["text","image","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-2.3/text-to-video","name":"LTX Video 2.3 Pro","created_by":"fal","source":"official","description":"LTX-2.3 is a high-quality, fast AI video model available in Pro and Fast variants for text-to-video, image-to-video, and audio-to-video.","status":"active","release_date":"2026-03-05","model_type":"video","page_url":"https://fal.run/fal-ai/ltx-2.3/text-to-video","tagline":"LTX-2.3 is a high-quality, fast AI video model available in Pro and Fast variants for text-to-video, image-to-video, and audio-to-video.","capabilities":{"vision":true},"modalities":{"input":["text","image","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-video-13b-dev/extend","name":"LTX Video-0.9.7 13B","created_by":"fal","source":"official","description":"Extend videos using LTX Video-0.9.7 13B and custom 
LoRA","status":"active","release_date":"2025-05-17","model_type":"other","parameters":13,"page_url":"https://fal.run/fal-ai/ltx-video-13b-dev/extend","tagline":"Extend videos using LTX Video-0.9.7 13B and custom LoRA","last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/ltx-video-13b-dev/image-to-video","name":"LTX Video-0.9.7 13B","created_by":"fal","source":"official","description":"Generate videos from prompts and images using LTX Video-0.9.7 13B and custom LoRA","status":"active","release_date":"2025-05-17","model_type":"video","parameters":13,"page_url":"https://fal.run/fal-ai/ltx-video-13b-dev/image-to-video","tagline":"Generate videos from prompts and images using LTX Video-0.9.7 13B and custom LoRA","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/ltx-video-13b-dev/multiconditioning","name":"LTX Video-0.9.7 13B","created_by":"fal","source":"official","description":"Generate videos from prompts, images, and videos using LTX Video-0.9.7 13B and custom LoRA","status":"active","release_date":"2025-05-17","model_type":"other","parameters":13,"page_url":"https://fal.run/fal-ai/ltx-video-13b-dev/multiconditioning","tagline":"Generate videos from prompts, images, and videos using LTX Video-0.9.7 13B and custom LoRA","capabilities":{"vision":true},"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/ltx-video-13b-dev","name":"LTX Video-0.9.7 13B","created_by":"fal","source":"official","description":"Generate videos from prompts using LTX Video-0.9.7 13B and custom LoRA","status":"active","release_date":"2025-05-17","model_type":"video","parameters":13,"page_url":"https://fal.run/fal-ai/ltx-video-13b-dev","tagline":"Generate videos from prompts using LTX Video-0.9.7 13B and custom 
LoRA","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/ltx-video-13b-distilled/extend","name":"LTX Video-0.9.7 13B Distilled","created_by":"fal","source":"official","description":"Extend videos using LTX Video-0.9.7 13B Distilled and custom LoRA","status":"active","release_date":"2025-05-17","model_type":"other","parameters":13,"page_url":"https://fal.run/fal-ai/ltx-video-13b-distilled/extend","tagline":"Extend videos using LTX Video-0.9.7 13B Distilled and custom LoRA","last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-video-13b-distilled/image-to-video","name":"LTX Video-0.9.7 13B Distilled","created_by":"fal","source":"official","description":"Generate videos from prompts and images using LTX Video-0.9.7 13B Distilled and custom LoRA","status":"active","release_date":"2025-05-17","model_type":"video","parameters":13,"page_url":"https://fal.run/fal-ai/ltx-video-13b-distilled/image-to-video","tagline":"Generate videos from prompts and images using LTX Video-0.9.7 13B Distilled and custom LoRA","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-video-13b-distilled/multiconditioning","name":"LTX Video-0.9.7 13B Distilled","created_by":"fal","source":"official","description":"Generate videos from prompts, images, and videos using LTX Video-0.9.7 13B Distilled and custom LoRA","status":"active","release_date":"2025-05-17","model_type":"other","parameters":13,"page_url":"https://fal.run/fal-ai/ltx-video-13b-distilled/multiconditioning","tagline":"Generate videos from prompts, images, and videos using LTX Video-0.9.7 13B Distilled and custom LoRA","capabilities":{"vision":true},"last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-video-13b-distilled","name":"LTX Video-0.9.7 13B 
Distilled","created_by":"fal","source":"official","description":"Generate videos from prompts using LTX Video-0.9.7 13B Distilled and custom LoRA","status":"active","release_date":"2025-05-17","model_type":"video","parameters":13,"page_url":"https://fal.run/fal-ai/ltx-video-13b-distilled","tagline":"Generate videos from prompts using LTX Video-0.9.7 13B Distilled and custom LoRA","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-video/image-to-video","name":"LTX Video (preview)","created_by":"fal","source":"official","description":"Generate videos from images using LTX Video","status":"active","release_date":"2024-11-21","model_type":"video","page_url":"https://fal.run/fal-ai/ltx-video/image-to-video","tagline":"Generate videos from images using LTX Video","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-video-lora/image-to-video","name":"LTX Video-0.9.7 LoRA","created_by":"fal","source":"official","description":"Generate videos from prompts and images using LTX Video-0.9.7 and custom LoRA","status":"active","release_date":"2025-05-15","model_type":"video","page_url":"https://fal.run/fal-ai/ltx-video-lora/image-to-video","tagline":"Generate videos from prompts and images using LTX Video-0.9.7 and custom LoRA","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/ltx-video-lora/multiconditioning","name":"LTX Video-0.9.7 LoRA","created_by":"fal","source":"official","description":"Generate videos from prompts, images, and videos using LTX Video-0.9.7 and custom 
LoRA","status":"active","release_date":"2025-05-15","model_type":"other","page_url":"https://fal.run/fal-ai/ltx-video-lora/multiconditioning","tagline":"Generate videos from prompts, images, and videos using LTX Video-0.9.7 and custom LoRA","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/ltx-video-trainer","name":"LTX Video Trainer","created_by":"fal","source":"official","description":"Train LTX Video 0.9.7 for custom styles and effects.","status":"active","release_date":"2025-05-08","model_type":"other","page_url":"https://fal.run/fal-ai/ltx-video-trainer","tagline":"Train LTX Video 0.9.7 for custom styles and effects.","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/ltx-video-v095/extend","name":"LTX Video-0.9.5","created_by":"fal","source":"official","description":"Generate videos from prompts and videos using LTX Video-0.9.5","status":"active","release_date":"2025-03-05","model_type":"other","page_url":"https://fal.run/fal-ai/ltx-video-v095/extend","tagline":"Generate videos from prompts and videos using LTX Video-0.9.5","last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-video-v095/multiconditioning","name":"LTX Video-0.9.5","created_by":"fal","source":"official","description":"Generate videos from prompts,images, and videos using LTX Video-0.9.5","status":"active","release_date":"2025-03-05","model_type":"other","page_url":"https://fal.run/fal-ai/ltx-video-v095/multiconditioning","tagline":"Generate videos from prompts,images, and videos using LTX Video-0.9.5","capabilities":{"vision":true},"last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-video-v095","name":"LTX Video-0.9.5","created_by":"fal","source":"official","description":"Generate videos from prompts using LTX Video-0.9.5","status":"active","release_date":"2025-03-05","model_type":"video","page_url":"https://fal.run/fal-ai/ltx-video-v095","tagline":"Generate videos from prompts 
using LTX Video-0.9.5","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx-video","name":"LTX Video (preview)","created_by":"fal","source":"official","description":"Generate videos from prompts using LTX Video","status":"active","release_date":"2024-10-04","model_type":"video","page_url":"https://fal.run/fal-ai/ltx-video","tagline":"Generate videos from prompts using LTX Video","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx2-v2v-trainer","name":"LTX-2 Video to Video Trainer","created_by":"fal","source":"official","description":"Train LTX-2 for video transformation or video-conditioned generation.","status":"active","release_date":"2026-01-07","model_type":"other","page_url":"https://fal.run/fal-ai/ltx2-v2v-trainer","tagline":"Train LTX-2 for video transformation or video-conditioned generation.","last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx2-video-trainer","name":"LTX-2 Video Trainer","created_by":"fal","source":"official","description":"Train LTX-2 for custom styles and effects.","status":"active","release_date":"2026-01-03","model_type":"other","page_url":"https://fal.run/fal-ai/ltx2-video-trainer","tagline":"Train LTX-2 for custom styles and effects.","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/ltx23-trainer-v2/a2a","name":"LTX 2.3 Trainer (V2) - Audio-to-Audio","created_by":"fal","source":"official","description":"Train a LoRA that transforms one audio clip into another, learning a reference→target mapping from paired audio examples.","status":"active","release_date":"2026-06-17","model_type":"other","page_url":"https://fal.run/fal-ai/ltx23-trainer-v2/a2a","tagline":"Train a LoRA that transforms one audio clip into another, learning a reference→target mapping from paired audio 
examples.","last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx23-trainer-v2/a2v","name":"LTX 2.3 Trainer (V2) - Audio-to-Video","created_by":"fal","source":"official","description":"Train a LoRA that generates video from a start image plus a conditioning audio track, producing motion that matches the sound.","status":"active","release_date":"2026-06-17","model_type":"other","page_url":"https://fal.run/fal-ai/ltx23-trainer-v2/a2v","tagline":"Train a LoRA that generates video from a start image plus a conditioning audio track, producing motion that matches the sound.","capabilities":{"vision":true},"last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx23-trainer-v2/audio-extend-prefix","name":"LTX 2.3 Trainer (V2) - Forward Audio Extension","created_by":"fal","source":"official","description":"Train a LoRA that continues an audio clip forward in time, generating the audio that follows a short clean prefix.","status":"active","release_date":"2026-06-17","model_type":"other","page_url":"https://fal.run/fal-ai/ltx23-trainer-v2/audio-extend-prefix","tagline":"Train a LoRA that continues an audio clip forward in time, generating the audio that follows a short clean prefix.","last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx23-trainer-v2/audio-extend-suffix","name":"LTX 2.3 Trainer (V2) - Backward Audio Extension","created_by":"fal","source":"official","description":"Train a LoRA that generates the lead-in to an audio clip, extending audio backward in time from its ending.","status":"active","release_date":"2026-06-17","model_type":"other","page_url":"https://fal.run/fal-ai/ltx23-trainer-v2/audio-extend-suffix","tagline":"Train a LoRA that generates the lead-in to an audio clip, extending audio backward in time from its ending.","last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx23-trainer-v2/audio-inpaint","name":"LTX 2.3 Trainer (V2) - Audio 
Inpainting","created_by":"fal","source":"official","description":"Train a LoRA that regenerates masked time spans of an audio clip while keeping the rest unchanged.","status":"active","release_date":"2026-06-17","model_type":"other","page_url":"https://fal.run/fal-ai/ltx23-trainer-v2/audio-inpaint","tagline":"Train a LoRA that regenerates masked time spans of an audio clip while keeping the rest unchanged.","last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx23-trainer-v2/av2av-masked","name":"LTX 2.3 Trainer (V2) - Masked Audio+Video Transformation","created_by":"fal","source":"official","description":"Train a LoRA that regenerates a masked video region (guided by kept pixels and a video reference) while jointly generating audio from an audio reference.","status":"active","release_date":"2026-06-17","model_type":"other","page_url":"https://fal.run/fal-ai/ltx23-trainer-v2/av2av-masked","tagline":"Train a LoRA that regenerates a masked video region (guided by kept pixels and a video reference) while jointly generating audio from an audio reference.","last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx23-trainer-v2/av2av","name":"LTX 2.3 Trainer (V2) - Audio+Video Reference Transformation","created_by":"fal","source":"official","description":"Train a LoRA for a joint audio+video transformation, conditioned on a reference clip (its video and audio) to produce a matching target clip.","status":"active","release_date":"2026-06-17","model_type":"other","page_url":"https://fal.run/fal-ai/ltx23-trainer-v2/av2av","tagline":"Train a LoRA for a joint audio+video transformation, conditioned on a reference clip (its video and audio) to produce a matching target clip.","last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx23-trainer-v2/extend-prefix","name":"LTX 2.3 Trainer (V2) - Forward Video Extension","created_by":"fal","source":"official","description":"Train a LoRA that continues a video forward in time — 
supply an opening clip at inference and the model generates what comes next.","status":"active","release_date":"2026-06-17","model_type":"other","page_url":"https://fal.run/fal-ai/ltx23-trainer-v2/extend-prefix","tagline":"Train a LoRA that continues a video forward in time — supply an opening clip at inference and the model generates what comes next.","last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx23-trainer-v2/extend-suffix","name":"LTX 2.3 Trainer (V2) - Backward Video Extension","created_by":"fal","source":"official","description":"Train a LoRA that generates the lead-in to a video, extending a clip backward in time from its ending.","status":"active","release_date":"2026-06-17","model_type":"other","page_url":"https://fal.run/fal-ai/ltx23-trainer-v2/extend-suffix","tagline":"Train a LoRA that generates the lead-in to a video, extending a clip backward in time from its ending.","last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx23-trainer-v2/i2v","name":"LTX 2.3 Trainer (V2) - Image-to-Video","created_by":"fal","source":"official","description":"Fine-tune LTX 2.3 to animate a starting image — supply a still plus a prompt at inference and the model generates a video that begins from that frame.","status":"active","release_date":"2026-06-17","model_type":"other","page_url":"https://fal.run/fal-ai/ltx23-trainer-v2/i2v","tagline":"Fine-tune LTX 2.3 to animate a starting image — supply a still plus a prompt at inference and the model generates a video that begins from that frame.","capabilities":{"vision":true},"last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx23-trainer-v2/ic-lora/a2a","name":"LTX 2.3 Trainer (V2) - Audio-to-Audio IC-LoRA","created_by":"fal","source":"official","description":"Train an IC-LoRA that transforms one audio clip into another, conditioned at inference on a reference audio 
clip.","status":"active","release_date":"2026-06-17","model_type":"other","page_url":"https://fal.run/fal-ai/ltx23-trainer-v2/ic-lora/a2a","tagline":"Train an IC-LoRA that transforms one audio clip into another, conditioned at inference on a reference audio clip.","last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx23-trainer-v2/ic-lora/av2av-masked","name":"LTX 2.3 Trainer (V2) - Masked Audio+Video IC-LoRA","created_by":"fal","source":"official","description":"Train an IC-LoRA that regenerates a masked video region (guided by kept pixels and a video reference) while jointly generating audio from an audio reference.","status":"active","release_date":"2026-06-17","model_type":"other","page_url":"https://fal.run/fal-ai/ltx23-trainer-v2/ic-lora/av2av-masked","tagline":"Train an IC-LoRA that regenerates a masked video region (guided by kept pixels and a video reference) while jointly generating audio from an audio reference.","last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx23-trainer-v2/ic-lora/av2av","name":"LTX 2.3 Trainer (V2) - Audio+Video Reference IC-LoRA","created_by":"fal","source":"official","description":"Train an IC-LoRA for a joint audio+video transformation, conditioned on a reference clip's video and audio to produce a matching target.","status":"active","release_date":"2026-06-17","model_type":"other","page_url":"https://fal.run/fal-ai/ltx23-trainer-v2/ic-lora/av2av","tagline":"Train an IC-LoRA for a joint audio+video transformation, conditioned on a reference clip's video and audio to produce a matching target.","last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx23-trainer-v2/ic-lora/v2v-masked","name":"LTX 2.3 Trainer (V2) - Masked Video-to-Video IC-LoRA","created_by":"fal","source":"official","description":"Train an IC-LoRA that regenerates only the masked region of a video, guided by the kept pixels and a separate reference/control 
video.","status":"active","release_date":"2026-06-17","model_type":"other","page_url":"https://fal.run/fal-ai/ltx23-trainer-v2/ic-lora/v2v-masked","tagline":"Train an IC-LoRA that regenerates only the masked region of a video, guided by the kept pixels and a separate reference/control video.","last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx23-trainer-v2/ic-lora/v2v","name":"LTX 2.3 Trainer (V2) - Video-to-Video IC-LoRA","created_by":"fal","source":"official","description":"Train an IC-LoRA that learns a video-to-video transformation from paired before/after clips, conditioned at inference on a reference (control) video.","status":"active","release_date":"2026-06-17","model_type":"other","page_url":"https://fal.run/fal-ai/ltx23-trainer-v2/ic-lora/v2v","tagline":"Train an IC-LoRA that learns a video-to-video transformation from paired before/after clips, conditioned at inference on a reference (control) video.","last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx23-trainer-v2/inpaint","name":"LTX 2.3 Trainer (V2) - Video Inpainting","created_by":"fal","source":"official","description":"Train a LoRA that regenerates a masked region of a video while keeping the rest unchanged, blending the new content with its surroundings.","status":"active","release_date":"2026-06-17","model_type":"other","page_url":"https://fal.run/fal-ai/ltx23-trainer-v2/inpaint","tagline":"Train a LoRA that regenerates a masked region of a video while keeping the rest unchanged, blending the new content with its surroundings.","last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx23-trainer-v2/interpolate","name":"LTX 2.3 Trainer (V2) - Keyframe Interpolation","created_by":"fal","source":"official","description":"Train a LoRA that generates the video between keyframes — supply first/last (and optional middle) frames at inference and the model fills the in-between 
motion.","status":"active","release_date":"2026-06-17","model_type":"other","page_url":"https://fal.run/fal-ai/ltx23-trainer-v2/interpolate","tagline":"Train a LoRA that generates the video between keyframes — supply first/last (and optional middle) frames at inference and the model fills the in-between motion.","last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx23-trainer-v2/outpaint","name":"LTX 2.3 Trainer (V2) - Spatial Outpainting","created_by":"fal","source":"official","description":"Train a LoRA that expands the video frame outward, keeping an inner rectangle fixed and generating the surrounding region.","status":"active","release_date":"2026-06-17","model_type":"other","page_url":"https://fal.run/fal-ai/ltx23-trainer-v2/outpaint","tagline":"Train a LoRA that expands the video frame outward, keeping an inner rectangle fixed and generating the surrounding region.","last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx23-trainer-v2/t2a","name":"LTX 2.3 Trainer (V2) - Text-to-Audio","created_by":"fal","source":"official","description":"Train a LoRA that generates audio from a text prompt — the audio counterpart of text-to-video — learning a sound or style from your clips.","status":"active","release_date":"2026-06-17","model_type":"other","page_url":"https://fal.run/fal-ai/ltx23-trainer-v2/t2a","tagline":"Train a LoRA that generates audio from a text prompt — the audio counterpart of text-to-video — learning a sound or style from your clips.","last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx23-trainer-v2/t2v","name":"LTX 2.3 Trainer (V2) - Text-to-Video","created_by":"fal","source":"official","description":"Fine-tune LTX 2.3 on your own clips to teach it a new subject, character, object, or visual style, then generate full videos from a text prompt.","status":"active","release_date":"2026-06-17","model_type":"other","page_url":"https://fal.run/fal-ai/ltx23-trainer-v2/t2v","tagline":"Fine-tune 
LTX 2.3 on your own clips to teach it a new subject, character, object, or visual style, then generate full videos from a text prompt.","last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx23-trainer-v2/v2a","name":"LTX 2.3 Trainer (V2) - Video-to-Audio","created_by":"fal","source":"official","description":"Train a LoRA that generates audio (foley / sound design) for a silent video, learning a soundtrack that matches the on-screen action.","status":"active","release_date":"2026-06-17","model_type":"other","page_url":"https://fal.run/fal-ai/ltx23-trainer-v2/v2a","tagline":"Train a LoRA that generates audio (foley / sound design) for a silent video, learning a soundtrack that matches the on-screen action.","last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx23-trainer-v2/v2v-masked","name":"LTX 2.3 Trainer (V2) - Masked Video-to-Video","created_by":"fal","source":"official","description":"Train a LoRA that regenerates only the masked region of a video, guided by both the kept pixels and a separate reference/control video.","status":"active","release_date":"2026-06-17","model_type":"other","page_url":"https://fal.run/fal-ai/ltx23-trainer-v2/v2v-masked","tagline":"Train a LoRA that regenerates only the masked region of a video, guided by both the kept pixels and a separate reference/control video.","last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx23-trainer-v2/v2v","name":"LTX 2.3 Trainer (V2) - Video-to-Video","created_by":"fal","source":"official","description":"Train a LoRA that learns a video-to-video transformation from paired before/after clips, steered at inference by a reference (control) video.","status":"active","release_date":"2026-06-17","model_type":"other","page_url":"https://fal.run/fal-ai/ltx23-trainer-v2/v2v","tagline":"Train a LoRA that learns a video-to-video transformation from paired before/after clips, steered at inference by a reference (control) 
video.","last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx23-v2v-trainer","name":"LTX-2.3 22B Video to Video Trainer","created_by":"fal","source":"official","description":"Train LTX-2.3 22B for video transformation or video-conditioned generation.","status":"active","release_date":"2026-03-17","model_type":"other","page_url":"https://fal.run/fal-ai/ltx23-v2v-trainer","tagline":"Train LTX-2.3 22B for video transformation or video-conditioned generation.","last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltx23-video-trainer","name":"LTX-2.3 22B Video Trainer","created_by":"fal","source":"official","description":"Train LTX-2.3 22B for custom styles and effects.","status":"active","release_date":"2026-03-17","model_type":"other","page_url":"https://fal.run/fal-ai/ltx23-video-trainer","tagline":"Train LTX-2.3 22B for custom styles and effects.","last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltxv-13b-098-distilled/extend","name":"LTX-Video 13B 0.9.8 Distilled","created_by":"fal","source":"official","description":"Extend videos using LTX Video-0.9.8 13B Distilled and custom LoRA","status":"active","release_date":"2025-07-23","model_type":"other","parameters":13,"page_url":"https://fal.run/fal-ai/ltxv-13b-098-distilled/extend","tagline":"Extend videos using LTX Video-0.9.8 13B Distilled and custom LoRA","last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltxv-13b-098-distilled/image-to-video","name":"LTX-Video 13B 0.9.8 Distilled","created_by":"fal","source":"official","description":"Generate long videos from prompts and images using LTX Video-0.9.8 13B Distilled and custom LoRA","status":"active","release_date":"2025-07-17","model_type":"video","parameters":13,"page_url":"https://fal.run/fal-ai/ltxv-13b-098-distilled/image-to-video","tagline":"Generate long videos from prompts and images using LTX Video-0.9.8 13B Distilled and custom 
LoRA","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltxv-13b-098-distilled/multiconditioning","name":"LTX-Video 13B 0.9.8 Distilled","created_by":"fal","source":"official","description":"Generate long videos from prompts, images, and videos using LTX Video-0.9.8 13B Distilled and custom LoRA","status":"active","release_date":"2025-07-17","model_type":"other","parameters":13,"page_url":"https://fal.run/fal-ai/ltxv-13b-098-distilled/multiconditioning","tagline":"Generate long videos from prompts, images, and videos using LTX Video-0.9.8 13B Distilled and custom LoRA","capabilities":{"vision":true},"last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/ltxv-13b-098-distilled","name":"LTX-Video 13B 0.9.8 Distilled","created_by":"fal","source":"official","description":"Generate long videos from prompts using LTX Video-0.9.8 13B Distilled and custom LoRA","status":"active","release_date":"2025-07-17","model_type":"video","parameters":13,"page_url":"https://fal.run/fal-ai/ltxv-13b-098-distilled","tagline":"Generate long videos from prompts using LTX Video-0.9.8 13B Distilled and custom LoRA","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/lucidflux","name":"Lucidflux","created_by":"fal","source":"official","description":"LucidFlux for upscaling images with very high fidelity","status":"active","release_date":"2025-10-03","model_type":"image","page_url":"https://fal.run/fal-ai/lucidflux","tagline":"LucidFlux for upscaling images with very high fidelity","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/luma-dream-machine/ray-2-flash/image-to-video","name":"Luma Ray 2 Flash (Image to 
Video)","created_by":"fal","source":"official","description":"Ray2 Flash is a fast video generative model capable of creating realistic visuals with natural, coherent motion.","status":"active","release_date":"2025-03-17","model_type":"video","page_url":"https://fal.run/fal-ai/luma-dream-machine/ray-2-flash/image-to-video","tagline":"Ray2 Flash is a fast video generative model capable of creating realistic visuals with natural, coherent motion.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/luma-dream-machine/ray-2-flash/modify","name":"Luma Ray 2 Flash Modify","created_by":"fal","source":"official","description":"Ray2 Flash Modify is a video generative model capable of restyling or retexturing the entire shot, from turning live-action into CG or stylized animation, to changing wardrobe, props, or the overall a","status":"active","release_date":"2025-07-17","model_type":"other","page_url":"https://fal.run/fal-ai/luma-dream-machine/ray-2-flash/modify","tagline":"Ray2 Flash Modify is a video generative model capable of restyling or retexturing the entire shot, from turning live-action into CG or stylized animation, to changing wardrobe, props, or the overall a","last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/luma-dream-machine/ray-2-flash/reframe","name":"Luma Ray 2 Flash Reframe","created_by":"fal","source":"official","description":"Adjust and enhance videos with Ray-2 Reframe.","status":"active","release_date":"2025-06-03","model_type":"other","page_url":"https://fal.run/fal-ai/luma-dream-machine/ray-2-flash/reframe","tagline":"Adjust and enhance videos with Ray-2 Reframe.","capabilities":{"tool_call":true},"tools":["function_calling"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/luma-dream-machine/ray-2-flash","name":"Luma Ray 2 
Flash","created_by":"fal","source":"official","description":"Ray2 Flash is a fast video generative model capable of creating realistic visuals with natural, coherent motion.","status":"active","release_date":"2025-03-17","model_type":"video","page_url":"https://fal.run/fal-ai/luma-dream-machine/ray-2-flash","tagline":"Ray2 Flash is a fast video generative model capable of creating realistic visuals with natural, coherent motion.","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/luma-dream-machine/ray-2/image-to-video","name":"Luma Ray 2 (Image to Video)","created_by":"fal","source":"official","description":"Ray2 is a large-scale video generative model capable of creating realistic visuals with natural, coherent motion.","status":"active","release_date":"2025-02-14","model_type":"video","page_url":"https://fal.run/fal-ai/luma-dream-machine/ray-2/image-to-video","tagline":"Ray2 is a large-scale video generative model capable of creating realistic visuals with natural, coherent motion.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/luma-dream-machine/ray-2/modify","name":"Luma Ray 2 Modify","created_by":"fal","source":"official","description":"Ray2 Modify is a video generative model capable of restyling or retexturing the entire shot, from turning live-action into CG or stylized animation, to changing wardrobe, props, or the overall aesthet","status":"active","release_date":"2025-06-28","model_type":"other","page_url":"https://fal.run/fal-ai/luma-dream-machine/ray-2/modify","tagline":"Ray2 Modify is a video generative model capable of restyling or retexturing the entire shot, from turning live-action into CG or stylized animation, to changing wardrobe, props, or the overall 
aesthet","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/luma-dream-machine/ray-2/reframe","name":"Luma Ray 2 Reframe","created_by":"fal","source":"official","description":"Adjust and enhance videos with Ray-2 Reframe.","status":"active","release_date":"2025-06-03","model_type":"other","page_url":"https://fal.run/fal-ai/luma-dream-machine/ray-2/reframe","tagline":"Adjust and enhance videos with Ray-2 Reframe.","capabilities":{"tool_call":true},"tools":["function_calling"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/luma-dream-machine/ray-2","name":"Luma Ray 2","created_by":"fal","source":"official","description":"Ray2 is a large-scale video generative model capable of creating realistic visuals with natural, coherent motion.","status":"active","release_date":"2025-01-27","model_type":"video","page_url":"https://fal.run/fal-ai/luma-dream-machine/ray-2","tagline":"Ray2 is a large-scale video generative model capable of creating realistic visuals with natural, coherent motion.","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/luma-photon/flash/modify","name":"Luma Photon","created_by":"fal","source":"official","description":"Edit images from your prompts using Luma Photon.","status":"active","release_date":"2025-06-08","model_type":"image","page_url":"https://fal.run/fal-ai/luma-photon/flash/modify","tagline":"Edit images from your prompts using Luma Photon.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/luma-photon/flash/reframe","name":"Luma Photon Flash Reframe","created_by":"fal","source":"official","description":"This advanced tool intelligently expands your visuals, seamlessly blending new content to enhance creativity and adaptability, offering unmatched speed and quality for 
creators at a fraction of the co","status":"active","release_date":"2025-06-03","model_type":"image","page_url":"https://fal.run/fal-ai/luma-photon/flash/reframe","tagline":"This advanced tool intelligently expands your visuals, seamlessly blending new content to enhance creativity and adaptability, offering unmatched speed and quality for creators at a fraction of the co","capabilities":{"vision":true,"tool_call":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"tools":["function_calling"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/luma-photon/flash","name":"Luma Photon Flash","created_by":"fal","source":"official","description":"Generate images from your prompts using Luma Photon Flash.","status":"active","release_date":"2024-12-03","model_type":"image","page_url":"https://fal.run/fal-ai/luma-photon/flash","tagline":"Generate images from your prompts using Luma Photon Flash.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/luma-photon/modify","name":"Luma Photon","created_by":"fal","source":"official","description":"Edit images from your prompts using Luma Photon.","status":"active","release_date":"2025-06-08","model_type":"image","page_url":"https://fal.run/fal-ai/luma-photon/modify","tagline":"Edit images from your prompts using Luma Photon.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/luma-photon/reframe","name":"Luma Photon Reframe","created_by":"fal","source":"official","description":"Extend and reframe images with Luma Photon Reframe.","status":"active","release_date":"2025-06-03","model_type":"image","page_url":"https://fal.run/fal-ai/luma-photon/reframe","tagline":"Extend and reframe images with Luma Photon 
Reframe.","capabilities":{"vision":true,"tool_call":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"tools":["function_calling"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/luma-photon","name":"Luma Photon","created_by":"fal","source":"official","description":"Generate images from your prompts using Luma Photon.","status":"active","release_date":"2024-06-03","model_type":"image","page_url":"https://fal.run/fal-ai/luma-photon","tagline":"Generate images from your prompts using Luma Photon.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/lumina-image/v2","name":"Lumina Image 2","created_by":"fal","source":"official","description":"Lumina-Image-2.0 is a 2 billion parameter flow-based diffusion transforer which features improved performance in image quality, typography, complex prompt understanding, and resource-efficiency.","status":"active","release_date":"2025-01-31","model_type":"image","page_url":"https://fal.run/fal-ai/lumina-image/v2","tagline":"Lumina-Image-2.0 is a 2 billion parameter flow-based diffusion transforer which features improved performance in image quality, typography, complex prompt understanding, and resource-efficiency.","capabilities":{"streaming":true,"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/lux-tts","name":"Lux TTS","created_by":"fal","source":"official","description":"High-quality voice cloning TTS model that generates 48kHz speech from text and a reference audio.","status":"active","release_date":"2026-03-12","model_type":"tts","page_url":"https://fal.run/fal-ai/lux-tts","tagline":"High-quality voice cloning TTS model that generates 48kHz speech from text and a reference 
audio.","modalities":{"input":["text"],"output":["audio"]},"endpoints":["audio_speech"],"last_seen_at":"2026-03-12","last_updated":"2026-05-11"},{"id":"fal-ai/lyra-2/zoom","name":"Lyra 2","created_by":"fal","source":"official","description":"Lyra 2.0 is an image-to-video model that turns a single image into an explorable 3D-style video with camera-controlled motion.","status":"active","release_date":"2026-04-21","model_type":"video","page_url":"https://fal.run/fal-ai/lyra-2/zoom","tagline":"Lyra 2.0 is an image-to-video model that turns a single image into an explorable 3D-style video with camera-controlled motion.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-28","last_updated":"2026-05-11"},{"id":"fal-ai/lyria2","name":"Lyria2","created_by":"fal","source":"official","description":"Lyria 2 is Google's latest music generation model, you can generate any type of music with this model.","status":"active","release_date":"2025-05-20","model_type":"other","page_url":"https://fal.run/fal-ai/lyria2","tagline":"Lyria 2 is Google's latest music generation model, you can generate any type of music with this model.","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/lyria3/pro","name":"Lyria 3 Pro","created_by":"fal","source":"official","description":"Lyria 3 Pro is the latest music model from Google","status":"active","release_date":"2026-05-20","model_type":"other","page_url":"https://fal.run/fal-ai/lyria3/pro","tagline":"Lyria 3 Pro is the latest music model from Google","last_seen_at":"2026-05-26","last_updated":"2026-06-03"},{"id":"fal-ai/lyria3","name":"Lyria3","created_by":"fal","source":"official","description":"Lyria 3 is most recent music model from Google","status":"active","release_date":"2026-03-30","model_type":"other","page_url":"https://fal.run/fal-ai/lyria3","tagline":"Lyria 3 is most recent music model from 
Google","last_seen_at":"2026-05-22","last_updated":"2026-06-03"},{"id":"fal-ai/magi-distilled/extend-video","name":"MAGI-1 (Distilled)","created_by":"fal","source":"official","description":"MAGI-1 distilled extends videos faster with an exceptional understanding of physical interactions and prompts","status":"active","release_date":"2025-04-23","model_type":"other","page_url":"https://fal.run/fal-ai/magi-distilled/extend-video","tagline":"MAGI-1 distilled extends videos faster with an exceptional understanding of physical interactions and prompts","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/magi-distilled/image-to-video","name":"MAGI-1 (Distilled)","created_by":"fal","source":"official","description":"MAGI-1 distilled generates videos faster from images with exceptional understanding of physical interactions and prompting","status":"active","release_date":"2025-04-23","model_type":"video","page_url":"https://fal.run/fal-ai/magi-distilled/image-to-video","tagline":"MAGI-1 distilled generates videos faster from images with exceptional understanding of physical interactions and prompting","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/magi-distilled","name":"MAGI-1 (Distilled)","created_by":"fal","source":"official","description":"MAGI-1 distilled is a faster video generation model with exceptional understanding of physical interactions and cinematic prompts","status":"active","release_date":"2025-04-22","model_type":"video","page_url":"https://fal.run/fal-ai/magi-distilled","tagline":"MAGI-1 distilled is a faster video generation model with exceptional understanding of physical interactions and cinematic 
prompts","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/magi/extend-video","name":"MAGI-1","created_by":"fal","source":"official","description":"MAGI-1 extends videos with an exceptional understanding of physical interactions and prompts","status":"active","release_date":"2025-04-23","model_type":"other","page_url":"https://fal.run/fal-ai/magi/extend-video","tagline":"MAGI-1 extends videos with an exceptional understanding of physical interactions and prompts","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/magi/image-to-video","name":"MAGI-1","created_by":"fal","source":"official","description":"MAGI-1 generates videos from images with exceptional understanding of physical interactions and prompting","status":"active","release_date":"2025-04-23","model_type":"video","page_url":"https://fal.run/fal-ai/magi/image-to-video","tagline":"MAGI-1 generates videos from images with exceptional understanding of physical interactions and prompting","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/magi","name":"MAGI-1","created_by":"fal","source":"official","description":"MAGI-1 is a video generation model with exceptional understanding of physical interactions and cinematic prompts","status":"active","release_date":"2025-04-23","model_type":"video","page_url":"https://fal.run/fal-ai/magi","tagline":"MAGI-1 is a video generation model with exceptional understanding of physical interactions and cinematic prompts","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/marlin/find","name":"Marlin Find","created_by":"fal","source":"official","description":"Marlin is a 2B video VLM tuned for the two questions developers actually want to ask of 
their videos: what is happening, and when?","status":"active","release_date":"2026-05-21","model_type":"other","page_url":"https://fal.run/fal-ai/marlin/find","tagline":"Marlin is a 2B video VLM tuned for the two questions developers actually want to ask of their videos: what is happening, and when?","capabilities":{"vision":true},"last_seen_at":"2026-05-21","last_updated":"2026-06-03"},{"id":"fal-ai/marlin","name":"Marlin","created_by":"fal","source":"official","description":"Marlin is a 2B video VLM tuned for the two questions developers actually want to ask of their videos: what is happening, and when?","status":"active","release_date":"2026-05-21","model_type":"other","page_url":"https://fal.run/fal-ai/marlin","tagline":"Marlin is a 2B video VLM tuned for the two questions developers actually want to ask of their videos: what is happening, and when?","capabilities":{"vision":true},"last_seen_at":"2026-05-21","last_updated":"2026-06-03"},{"id":"fal-ai/maya/batch","name":"Maya","created_by":"fal","source":"official","description":"Maya1 is a state-of-the-art speech model by Maya Research for expressive voice generation, built to capture real human emotion and precise voice design.","status":"active","release_date":"2025-12-12","model_type":"tts","page_url":"https://fal.run/fal-ai/maya/batch","tagline":"Maya1 is a state-of-the-art speech model by Maya Research for expressive voice generation, built to capture real human emotion and precise voice design.","modalities":{"input":["text"],"output":["audio"]},"endpoints":["audio_speech"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/maya/stream","name":"Maya","created_by":"fal","source":"official","description":"Maya1 is a state-of-the-art speech model by Maya Research for expressive voice generation, built to capture real human emotion and precise voice design.","status":"active","release_date":"2025-12-12","model_type":"tts","page_url":"https://fal.run/fal-ai/maya/stream","tagline":"Maya1 is 
a state-of-the-art speech model by Maya Research for expressive voice generation, built to capture real human emotion and precise voice design.","modalities":{"input":["text"],"output":["audio"]},"endpoints":["audio_speech"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/maya","name":"Maya1","created_by":"fal","source":"official","description":"Maya1 is a state-of-the-art speech model by Maya Research for expressive voice generation, built to capture real human emotion and precise voice design.","status":"active","release_date":"2025-11-15","model_type":"tts","page_url":"https://fal.run/fal-ai/maya","tagline":"Maya1 is a state-of-the-art speech model by Maya Research for expressive voice generation, built to capture real human emotion and precise voice design.","modalities":{"input":["text"],"output":["audio"]},"endpoints":["audio_speech"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/meshy/rigging/multi-animation","name":"Meshy Rigging Multi Animation","created_by":"fal","source":"official","description":"Meshy auto-rigs a humanoid 3D model fitting a skeleton and binding the mesh, then applies several motion presets from its animation library","status":"active","release_date":"2026-06-12","model_type":"other","page_url":"https://fal.run/fal-ai/meshy/rigging/multi-animation","tagline":"Meshy auto-rigs a humanoid 3D model fitting a skeleton and binding the mesh, then applies several motion presets from its animation library","last_seen_at":"2026-06-17","last_updated":"2026-06-18"},{"id":"fal-ai/meshy/rigging","name":"Meshy Rigging","created_by":"fal","source":"official","description":"Rig humanoid 3D models from GLB URLs with Meshy, returning rigged GLB/FBX files plus basic animations.","status":"active","release_date":"2026-05-19","model_type":"other","page_url":"https://fal.run/fal-ai/meshy/rigging","tagline":"Rig humanoid 3D models from GLB URLs with Meshy, returning rigged GLB/FBX files plus basic 
animations.","last_seen_at":"2026-06-17","last_updated":"2026-06-18"},{"id":"fal-ai/meshy/v5/multi-image-to-3d","name":"Meshy 5 Multi","created_by":"fal","source":"official","description":"Meshy-5 multi image generates realistic and production ready 3D models from multiple images.","status":"active","release_date":"2025-10-06","model_type":"other","page_url":"https://fal.run/fal-ai/meshy/v5/multi-image-to-3d","tagline":"Meshy-5 multi image generates realistic and production ready 3D models from multiple images.","capabilities":{"vision":true},"last_seen_at":"2026-06-17","last_updated":"2026-06-18"},{"id":"fal-ai/meshy/v5/remesh","name":"Meshy 5 Remesh","created_by":"fal","source":"official","description":"Meshy-5 remesh allows you to remesh and export existing 3D models into various formats","status":"active","release_date":"2025-10-18","model_type":"other","page_url":"https://fal.run/fal-ai/meshy/v5/remesh","tagline":"Meshy-5 remesh allows you to remesh and export existing 3D models into various formats","last_seen_at":"2026-06-17","last_updated":"2026-06-18"},{"id":"fal-ai/meshy/v5/retexture","name":"Meshy 5 Retexture","created_by":"fal","source":"official","description":"Meshy-5 retexture applies new, high-quality textures to existing 3D models using either text prompts or reference images.","status":"active","release_date":"2025-10-18","model_type":"other","page_url":"https://fal.run/fal-ai/meshy/v5/retexture","tagline":"Meshy-5 retexture applies new, high-quality textures to existing 3D models using either text prompts or reference images.","capabilities":{"vision":true},"last_seen_at":"2026-06-17","last_updated":"2026-06-18"},{"id":"fal-ai/meshy/v6/image-to-3d","name":"Meshy 6","created_by":"fal","source":"official","description":"Meshy-6 is the latest model from Meshy.","status":"active","release_date":"2026-02-09","model_type":"other","page_url":"https://fal.run/fal-ai/meshy/v6/image-to-3d","tagline":"Meshy-6 is the latest model from 
Meshy.","capabilities":{"vision":true},"last_seen_at":"2026-06-17","last_updated":"2026-06-18"},{"id":"fal-ai/meshy/v6/multi-image-to-3d","name":"Meshy 6 - Multi Image To 3D","created_by":"fal","source":"official","description":"Meshy-6 is the latest model from Meshy.","status":"active","release_date":"2026-04-23","model_type":"other","page_url":"https://fal.run/fal-ai/meshy/v6/multi-image-to-3d","tagline":"Meshy-6 is the latest model from Meshy.","capabilities":{"vision":true},"last_seen_at":"2026-06-17","last_updated":"2026-06-18"},{"id":"fal-ai/meshy/v6-preview/image-to-3d","name":"Meshy 6 Preview","created_by":"fal","source":"official","description":"Meshy-6-Preview is the latest model from Meshy.","status":"active","release_date":"2025-10-06","model_type":"other","page_url":"https://fal.run/fal-ai/meshy/v6-preview/image-to-3d","tagline":"Meshy-6-Preview is the latest model from Meshy.","capabilities":{"vision":true},"last_seen_at":"2026-06-17","last_updated":"2026-06-18"},{"id":"fal-ai/meshy/v6-preview/text-to-3d","name":"Meshy 6 Preview","created_by":"fal","source":"official","description":"Meshy-6-Preview is the latest model from Meshy.","status":"active","release_date":"2025-10-06","model_type":"other","page_url":"https://fal.run/fal-ai/meshy/v6-preview/text-to-3d","tagline":"Meshy-6-Preview is the latest model from Meshy.","last_seen_at":"2026-06-17","last_updated":"2026-06-18"},{"id":"fal-ai/meshy/v6/text-to-3d","name":"Meshy 6","created_by":"fal","source":"official","description":"Meshy-6 is the latest model from Meshy.","status":"active","release_date":"2026-02-09","model_type":"other","page_url":"https://fal.run/fal-ai/meshy/v6/text-to-3d","tagline":"Meshy-6 is the latest model from Meshy.","last_seen_at":"2026-06-17","last_updated":"2026-06-18"},{"id":"fal-ai/minimax/hailuo-02-fast/image-to-video","name":"Minimax","created_by":"fal","source":"official","family":"minimax","description":"Create blazing fast and economical videos with MiniMax Hailuo-02 
Image To Video API at 512p resolution","status":"active","release_date":"2025-08-06","model_type":"video","page_url":"https://fal.run/fal-ai/minimax/hailuo-02-fast/image-to-video","tagline":"Create blazing fast and economical videos with MiniMax Hailuo-02 Image To Video API at 512p resolution","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/minimax/hailuo-02/pro/image-to-video","name":"MiniMax Hailuo 02 [Pro] (Image to Video)","created_by":"fal","source":"official","family":"minimax","description":"MiniMax Hailuo-02 Image To Video API (Pro, 1080p): Advanced image-to-video generation model with 1080p resolution","status":"active","release_date":"2025-06-18","model_type":"video","page_url":"https://fal.run/fal-ai/minimax/hailuo-02/pro/image-to-video","tagline":"MiniMax Hailuo-02 Image To Video API (Pro, 1080p): Advanced image-to-video generation model with 1080p resolution","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/minimax/hailuo-02/pro/text-to-video","name":"MiniMax Hailuo 02 [Pro] (Text to Video)","created_by":"fal","source":"official","family":"minimax","description":"MiniMax Hailuo-02 Text To Video API (Pro, 1080p): Advanced video generation model with 1080p resolution","status":"active","release_date":"2025-06-18","model_type":"video","page_url":"https://fal.run/fal-ai/minimax/hailuo-02/pro/text-to-video","tagline":"MiniMax Hailuo-02 Text To Video API (Pro, 1080p): Advanced video generation model with 1080p resolution","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/minimax/hailuo-02/standard/image-to-video","name":"MiniMax Hailuo 02 [Standard] (Image to 
Video)","created_by":"fal","source":"official","family":"minimax","description":"MiniMax Hailuo-02 Image To Video API (Standard, 768p, 512p): Advanced image-to-video generation model with 768p and 512p resolutions","status":"active","release_date":"2025-06-18","model_type":"video","page_url":"https://fal.run/fal-ai/minimax/hailuo-02/standard/image-to-video","tagline":"MiniMax Hailuo-02 Image To Video API (Standard, 768p, 512p): Advanced image-to-video generation model with 768p and 512p resolutions","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/minimax/hailuo-02/standard/text-to-video","name":"MiniMax Hailuo 02 [Standard] (Text to Video)","created_by":"fal","source":"official","family":"minimax","description":"MiniMax Hailuo-02 Text To Video API (Standard, 768p): Advanced video generation model with 768p resolution","status":"active","release_date":"2025-06-18","model_type":"video","page_url":"https://fal.run/fal-ai/minimax/hailuo-02/standard/text-to-video","tagline":"MiniMax Hailuo-02 Text To Video API (Standard, 768p): Advanced video generation model with 768p resolution","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/minimax/hailuo-2.3-fast/pro/image-to-video","name":"MiniMax Hailuo 2.3 Fast [Pro] (Image to Video)","created_by":"fal","source":"official","family":"minimax","description":"MiniMax Hailuo-2.3-Fast Image To Video API (Pro, 1080p): Advanced fast image-to-video generation model with 1080p resolution","status":"active","release_date":"2025-10-27","model_type":"video","page_url":"https://fal.run/fal-ai/minimax/hailuo-2.3-fast/pro/image-to-video","tagline":"MiniMax Hailuo-2.3-Fast Image To Video API (Pro, 1080p): Advanced fast image-to-video generation model with 1080p 
resolution","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/minimax/hailuo-2.3-fast/standard/image-to-video","name":"MiniMax Hailuo 2.3 Fast [Standard] (Image to Video)","created_by":"fal","source":"official","family":"minimax","description":"MiniMax Hailuo-2.3-Fast Image To Video API (Standard, 768p): Advanced fast image-to-video generation model with 768p resolution","status":"active","release_date":"2025-10-27","model_type":"video","page_url":"https://fal.run/fal-ai/minimax/hailuo-2.3-fast/standard/image-to-video","tagline":"MiniMax Hailuo-2.3-Fast Image To Video API (Standard, 768p): Advanced fast image-to-video generation model with 768p resolution","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/minimax/hailuo-2.3/pro/image-to-video","name":"MiniMax Hailuo 2.3 [Pro] (Image to Video)","created_by":"fal","source":"official","family":"minimax","description":"MiniMax Hailuo-2.3 Image To Video API (Pro, 1080p): Advanced image-to-video generation model with 1080p resolution","status":"active","release_date":"2025-10-27","model_type":"video","page_url":"https://fal.run/fal-ai/minimax/hailuo-2.3/pro/image-to-video","tagline":"MiniMax Hailuo-2.3 Image To Video API (Pro, 1080p): Advanced image-to-video generation model with 1080p resolution","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/minimax/hailuo-2.3/pro/text-to-video","name":"MiniMax Hailuo 2.3 [Pro] (Text to Video)","created_by":"fal","source":"official","family":"minimax","description":"MiniMax Hailuo-2.3 Text To Video API (Pro, 1080p): Advanced text-to-video generation model with 1080p 
resolution","status":"active","release_date":"2025-10-27","model_type":"video","page_url":"https://fal.run/fal-ai/minimax/hailuo-2.3/pro/text-to-video","tagline":"MiniMax Hailuo-2.3 Text To Video API (Pro, 1080p): Advanced text-to-video generation model with 1080p resolution","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/minimax/hailuo-2.3/standard/image-to-video","name":"MiniMax Hailuo 2.3 [Standard] (Image to Video)","created_by":"fal","source":"official","family":"minimax","description":"MiniMax Hailuo-2.3 Image To Video API (Standard, 768p): Advanced image-to-video generation model with 768p resolution","status":"active","release_date":"2025-10-27","model_type":"video","page_url":"https://fal.run/fal-ai/minimax/hailuo-2.3/standard/image-to-video","tagline":"MiniMax Hailuo-2.3 Image To Video API (Standard, 768p): Advanced image-to-video generation model with 768p resolution","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/minimax/hailuo-2.3/standard/text-to-video","name":"MiniMax Hailuo 2.3 [Standard] (Text to Video)","created_by":"fal","source":"official","family":"minimax","description":"MiniMax Hailuo-2.3 Text To Video API (Standard, 768p): Advanced text-to-video generation model with 768p resolution","status":"active","release_date":"2025-10-27","model_type":"video","page_url":"https://fal.run/fal-ai/minimax/hailuo-2.3/standard/text-to-video","tagline":"MiniMax Hailuo-2.3 Text To Video API (Standard, 768p): Advanced text-to-video generation model with 768p resolution","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/minimax/image-01/subject-reference","name":"Minimax Image Subject 
Reference","created_by":"fal","source":"official","family":"minimax","description":"Generate images from text and a reference image using MiniMax Image-01 for consistent character appearance.","status":"active","release_date":"2025-05-06","model_type":"image","page_url":"https://fal.run/fal-ai/minimax/image-01/subject-reference","tagline":"Generate images from text and a reference image using MiniMax Image-01 for consistent character appearance.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/minimax/image-01","name":"MiniMax (Hailuo AI) Text to Image","created_by":"fal","source":"official","family":"minimax","description":"Generate high quality images from text prompts using MiniMax Image-01.","status":"active","release_date":"2025-05-06","model_type":"image","page_url":"https://fal.run/fal-ai/minimax/image-01","tagline":"Generate high quality images from text prompts using MiniMax Image-01.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/minimax-music/v1.5","name":"MiniMax (Hailuo AI) Music v1.5","created_by":"fal","source":"official","family":"minimax","description":"Generate music from text prompts using the MiniMax model, which leverages advanced AI techniques to create high-quality, diverse musical compositions.","status":"active","release_date":"2025-09-11","model_type":"other","page_url":"https://fal.run/fal-ai/minimax-music/v1.5","tagline":"Generate music from text prompts using the MiniMax model, which leverages advanced AI techniques to create high-quality, diverse musical compositions.","last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/minimax-music/v2.5","name":"Minimax Music 2.5","created_by":"fal","source":"official","family":"minimax","description":"MiniMax Music 2.5 
creates complete tracks with singing, backing music, and detailed arrangements from lyrics and a style description.","status":"active","release_date":"2026-04-11","model_type":"other","page_url":"https://fal.run/fal-ai/minimax-music/v2.5","tagline":"MiniMax Music 2.5 creates complete tracks with singing, backing music, and detailed arrangements from lyrics and a style description.","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/minimax-music/v2.6","name":"Minimax Music 2.6","created_by":"fal","source":"official","family":"minimax","description":"MiniMax Music 2.6 creates complete tracks with singing, backing music, and detailed arrangements from lyrics and a style description.","status":"active","release_date":"2026-04-11","model_type":"other","page_url":"https://fal.run/fal-ai/minimax-music/v2.6","tagline":"MiniMax Music 2.6 creates complete tracks with singing, backing music, and detailed arrangements from lyrics and a style description.","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/minimax-music/v2","name":"Minimax Music","created_by":"fal","source":"official","family":"minimax","description":"Generate music from text prompts using the MiniMax Music 2.0 model, which leverages advanced AI techniques to create high-quality, diverse musical compositions.","status":"active","release_date":"2025-10-30","model_type":"other","page_url":"https://fal.run/fal-ai/minimax-music/v2","tagline":"Generate music from text prompts using the MiniMax Music 2.0 model, which leverages advanced AI techniques to create high-quality, diverse musical compositions.","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/minimax-music","name":"MiniMax (Hailuo AI) Music","created_by":"fal","source":"official","family":"minimax","description":"Generate music from text prompts using the MiniMax model, which leverages advanced AI techniques to create high-quality, diverse musical 
compositions.","status":"active","release_date":"2024-12-17","model_type":"other","page_url":"https://fal.run/fal-ai/minimax-music","tagline":"Generate music from text prompts using the MiniMax model, which leverages advanced AI techniques to create high-quality, diverse musical compositions.","last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/minimax/preview/speech-2.5-hd","name":"Minimax","created_by":"fal","source":"official","family":"minimax","description":"Generate speech from text prompts and different voices using the MiniMax Speech-02 HD model, which leverages advanced AI techniques to create high-quality text-to-speech.","status":"active","release_date":"2025-08-11","model_type":"tts","page_url":"https://fal.run/fal-ai/minimax/preview/speech-2.5-hd","tagline":"Generate speech from text prompts and different voices using the MiniMax Speech-02 HD model, which leverages advanced AI techniques to create high-quality text-to-speech.","modalities":{"input":["text"],"output":["audio"]},"endpoints":["audio_speech"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/minimax/preview/speech-2.5-turbo","name":"Minimax","created_by":"fal","source":"official","family":"minimax","description":"Generate fast speech from text prompts and different voices using the MiniMax Speech-02 Turbo model, which leverages advanced AI techniques to create high-quality text-to-speech.","status":"active","release_date":"2025-08-11","model_type":"tts","page_url":"https://fal.run/fal-ai/minimax/preview/speech-2.5-turbo","tagline":"Generate fast speech from text prompts and different voices using the MiniMax Speech-02 Turbo model, which leverages advanced AI techniques to create high-quality text-to-speech.","modalities":{"input":["text"],"output":["audio"]},"endpoints":["audio_speech"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/minimax/speech-02-hd","name":"MiniMax Speech-02 
HD","created_by":"fal","source":"official","family":"minimax","description":"Generate speech from text prompts and different voices using the MiniMax Speech-02 HD model, which leverages advanced AI techniques to create high-quality text-to-speech.","status":"active","release_date":"2025-05-06","model_type":"tts","page_url":"https://fal.run/fal-ai/minimax/speech-02-hd","tagline":"Generate speech from text prompts and different voices using the MiniMax Speech-02 HD model, which leverages advanced AI techniques to create high-quality text-to-speech.","modalities":{"input":["text"],"output":["audio"]},"endpoints":["audio_speech"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/minimax/speech-02-turbo","name":"MiniMax Speech-02 Turbo","created_by":"fal","source":"official","family":"minimax","description":"Generate fast speech from text prompts and different voices using the MiniMax Speech-02 Turbo model, which leverages advanced AI techniques to create high-quality text-to-speech.","status":"active","release_date":"2025-05-06","model_type":"tts","page_url":"https://fal.run/fal-ai/minimax/speech-02-turbo","tagline":"Generate fast speech from text prompts and different voices using the MiniMax Speech-02 Turbo model, which leverages advanced AI techniques to create high-quality text-to-speech.","modalities":{"input":["text"],"output":["audio"]},"endpoints":["audio_speech"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/minimax/speech-2.6-hd","name":"MiniMax Speech 2.6 [HD]","created_by":"fal","source":"official","family":"minimax","description":"Generate speech from text prompts and different voices using the MiniMax Speech-2.6 HD model, which leverages advanced AI techniques to create high-quality text-to-speech.","status":"active","release_date":"2025-10-29","model_type":"tts","page_url":"https://fal.run/fal-ai/minimax/speech-2.6-hd","tagline":"Generate speech from text prompts and different voices using the MiniMax 
Speech-2.6 HD model, which leverages advanced AI techniques to create high-quality text-to-speech.","capabilities":{"streaming":true},"modalities":{"input":["text"],"output":["audio"]},"endpoints":["audio_speech"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/minimax/speech-2.6-turbo","name":"MiniMax Speech 2.6 [Turbo]","created_by":"fal","source":"official","family":"minimax","description":"Generate speech from text prompts and different voices using the MiniMax Speech-2.6 HD model, which leverages advanced AI techniques to create high-quality text-to-speech.","status":"active","release_date":"2025-10-29","model_type":"tts","page_url":"https://fal.run/fal-ai/minimax/speech-2.6-turbo","tagline":"Generate speech from text prompts and different voices using the MiniMax Speech-2.6 HD model, which leverages advanced AI techniques to create high-quality text-to-speech.","capabilities":{"streaming":true},"modalities":{"input":["text"],"output":["audio"]},"endpoints":["audio_speech"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/minimax/speech-2.8-hd","name":"MiniMax Speech 2.8 [HD]","created_by":"fal","source":"official","family":"minimax","description":"Generate speech from text prompts and different voices using the MiniMax Speech-2.8 HD model, which leverages advanced AI techniques to create high-quality text-to-speech.","status":"active","release_date":"2026-02-04","model_type":"tts","page_url":"https://fal.run/fal-ai/minimax/speech-2.8-hd","tagline":"Generate speech from text prompts and different voices using the MiniMax Speech-2.8 HD model, which leverages advanced AI techniques to create high-quality text-to-speech.","capabilities":{"streaming":true},"modalities":{"input":["text"],"output":["audio"]},"endpoints":["audio_speech"],"last_seen_at":"2026-05-07","last_updated":"2026-05-11"},{"id":"fal-ai/minimax/speech-2.8-turbo","name":"MiniMax Speech 2.8 
[Turbo]","created_by":"fal","source":"official","family":"minimax","description":"Generate speech from text prompts and different voices using the MiniMax Speech-2.8 Turbo model, which leverages advanced AI techniques to create high-quality text-to-speech.","status":"active","release_date":"2026-02-04","model_type":"tts","page_url":"https://fal.run/fal-ai/minimax/speech-2.8-turbo","tagline":"Generate speech from text prompts and different voices using the MiniMax Speech-2.8 Turbo model, which leverages advanced AI techniques to create high-quality text-to-speech.","capabilities":{"streaming":true},"modalities":{"input":["text"],"output":["audio"]},"endpoints":["audio_speech"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/minimax/video-01-director/image-to-video","name":"MiniMax (Hailuo AI) Video 01 Director - Image to Video","created_by":"fal","source":"official","family":"minimax","description":"Generate video clips more accurately with respect to initial image, natural language descriptions, and using camera movement instructions for shot control.","status":"active","release_date":"2025-02-24","model_type":"video","page_url":"https://fal.run/fal-ai/minimax/video-01-director/image-to-video","tagline":"Generate video clips more accurately with respect to initial image, natural language descriptions, and using camera movement instructions for shot control.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/minimax/video-01-director","name":"MiniMax (Hailuo AI) Video 01 Director","created_by":"fal","source":"official","family":"minimax","description":"Generate video clips more accurately with respect to natural language descriptions and using camera movement instructions for shot 
control.","status":"active","release_date":"2025-02-11","model_type":"video","page_url":"https://fal.run/fal-ai/minimax/video-01-director","tagline":"Generate video clips more accurately with respect to natural language descriptions and using camera movement instructions for shot control.","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/minimax/video-01/image-to-video","name":"MiniMax (Hailuo AI) Video 01","created_by":"fal","source":"official","family":"minimax","description":"Generate video clips from your images using MiniMax Video model","status":"active","release_date":"2024-10-30","model_type":"video","page_url":"https://fal.run/fal-ai/minimax/video-01/image-to-video","tagline":"Generate video clips from your images using MiniMax Video model","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/minimax/video-01-live/image-to-video","name":"MiniMax (Hailuo AI) Video 01","created_by":"fal","source":"official","family":"minimax","description":"Generate video clips from your images using MiniMax Video model","status":"active","release_date":"2024-12-16","model_type":"video","page_url":"https://fal.run/fal-ai/minimax/video-01-live/image-to-video","tagline":"Generate video clips from your images using MiniMax Video model","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/minimax/video-01-live","name":"MiniMax (Hailuo AI) Video 01 Live","created_by":"fal","source":"official","family":"minimax","description":"Generate video clips from your prompts using MiniMax model","status":"active","release_date":"2024-12-16","model_type":"video","page_url":"https://fal.run/fal-ai/minimax/video-01-live","tagline":"Generate 
video clips from your prompts using MiniMax model","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/minimax/video-01-subject-reference","name":"MiniMax (Hailuo AI) Video 01 Subject Reference","created_by":"fal","source":"official","family":"minimax","description":"Generate video clips maintaining consistent, realistic facial features and identity across dynamic video content","status":"active","release_date":"2025-01-20","model_type":"video","page_url":"https://fal.run/fal-ai/minimax/video-01-subject-reference","tagline":"Generate video clips maintaining consistent, realistic facial features and identity across dynamic video content","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/minimax/video-01","name":"MiniMax (Hailuo AI) Video 01","created_by":"fal","source":"official","family":"minimax","description":"Generate video clips from your prompts using MiniMax model","status":"active","release_date":"2024-02-13","model_type":"video","page_url":"https://fal.run/fal-ai/minimax/video-01","tagline":"Generate video clips from your prompts using MiniMax model","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/minimax/voice-clone","name":"MiniMax Voice Cloning","created_by":"fal","source":"official","family":"minimax","description":"Clone a voice from a sample audio and generate speech from text prompts using the MiniMax model, which leverages advanced AI techniques to create high-quality text-to-speech.","status":"active","release_date":"2025-05-06","model_type":"tts","page_url":"https://fal.run/fal-ai/minimax/voice-clone","tagline":"Clone a voice from a sample audio and generate speech from text prompts using the MiniMax model, which leverages advanced 
AI techniques to create high-quality text-to-speech.","modalities":{"input":["text"],"output":["audio"]},"endpoints":["audio_speech"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/minimax/voice-design","name":"MiniMax Voice Design","created_by":"fal","source":"official","family":"minimax","description":"Design a personalized voice from a text description, and generate speech from text prompts using the MiniMax model, which leverages advanced AI techniques to create high-quality text-to-speech.","status":"active","release_date":"2025-07-18","model_type":"tts","page_url":"https://fal.run/fal-ai/minimax/voice-design","tagline":"Design a personalized voice from a text description, and generate speech from text prompts using the MiniMax model, which leverages advanced AI techniques to create high-quality text-to-speech.","modalities":{"input":["text"],"output":["audio"]},"endpoints":["audio_speech"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/mix-dehaze-net","name":"MixDehazer","created_by":"fal","source":"official","description":"An advanced dehaze model to remove atmospheric haze, restoring clarity and detail in images through intelligent neural network processing.","status":"active","release_date":"2025-03-24","model_type":"image","page_url":"https://fal.run/fal-ai/mix-dehaze-net","tagline":"An advanced dehaze model to remove atmospheric haze, restoring clarity and detail in images through intelligent neural network processing.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/mmaudio-v2/text-to-audio","name":"MMAudio V2 Text to Audio","created_by":"fal","source":"official","description":"MMAudio generates synchronized audio given text 
inputs.","status":"active","release_date":"2024-12-20","model_type":"other","page_url":"https://fal.run/fal-ai/mmaudio-v2/text-to-audio","tagline":"MMAudio generates synchronized audio given text inputs.","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/mmaudio-v2","name":"MMAudio V2","created_by":"fal","source":"official","description":"MMAudio generates synchronized audio given video and/or text inputs.","status":"active","release_date":"2024-12-12","model_type":"other","page_url":"https://fal.run/fal-ai/mmaudio-v2","tagline":"MMAudio generates synchronized audio given video and/or text inputs.","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/mochi-v1","name":"Mochi 1","created_by":"fal","source":"official","description":"Mochi 1 preview is an open state-of-the-art video generation model with high-fidelity motion and strong prompt adherence in preliminary evaluation.","status":"active","release_date":"2024-11-07","model_type":"video","page_url":"https://fal.run/fal-ai/mochi-v1","tagline":"Mochi 1 preview is an open state-of-the-art video generation model with high-fidelity motion and strong prompt adherence in preliminary evaluation.","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/moondream/batched","name":"Moondream","created_by":"fal","source":"official","description":"Answer questions from the images.","status":"active","release_date":"2024-03-20","model_type":"other","page_url":"https://fal.run/fal-ai/moondream/batched","tagline":"Answer questions from the images.","capabilities":{"vision":true},"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/moondream-next/batch","name":"MoonDreamNext Batch","created_by":"fal","source":"official","description":"MoonDreamNext Batch is a multimodal vision-language model for batch 
captioning.","status":"active","release_date":"2025-01-17","model_type":"other","page_url":"https://fal.run/fal-ai/moondream-next/batch","tagline":"MoonDreamNext Batch is a multimodal vision-language model for batch captioning.","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/moondream-next/detection","name":"MoonDreamNext Detection","created_by":"fal","source":"official","description":"MoonDreamNext Detection is a multimodal vision-language model for gaze detection, bbox detection, point detection, and more.","status":"active","release_date":"2025-01-09","model_type":"image","page_url":"https://fal.run/fal-ai/moondream-next/detection","tagline":"MoonDreamNext Detection is a multimodal vision-language model for gaze detection, bbox detection, point detection, and more.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/moondream-next","name":"MoonDreamNext","created_by":"fal","source":"official","description":"MoonDreamNext is a multimodal vision-language model for captioning, gaze detection, bbox detection, point detection, and more.","status":"active","release_date":"2025-01-09","model_type":"other","page_url":"https://fal.run/fal-ai/moondream-next","tagline":"MoonDreamNext is a multimodal vision-language model for captioning, gaze detection, bbox detection, point detection, and more.","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/moondream2/object-detection","name":"Moondream2","created_by":"fal","source":"official","description":"Moondream2 is a highly efficient open-source vision language model that combines powerful image understanding capabilities with a remarkably small 
footprint.","status":"active","release_date":"2025-04-26","model_type":"other","page_url":"https://fal.run/fal-ai/moondream2/object-detection","tagline":"Moondream2 is a highly efficient open-source vision language model that combines powerful image understanding capabilities with a remarkably small footprint.","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/moondream2/point-object-detection","name":"Moondream2","created_by":"fal","source":"official","description":"Moondream2 is a highly efficient open-source vision language model that combines powerful image understanding capabilities with a remarkably small footprint.","status":"active","release_date":"2025-04-26","model_type":"other","page_url":"https://fal.run/fal-ai/moondream2/point-object-detection","tagline":"Moondream2 is a highly efficient open-source vision language model that combines powerful image understanding capabilities with a remarkably small footprint.","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/moondream2/visual-query","name":"Moondream2","created_by":"fal","source":"official","description":"Moondream2 is a highly efficient open-source vision language model that combines powerful image understanding capabilities with a remarkably small footprint.","status":"active","release_date":"2025-04-26","model_type":"other","page_url":"https://fal.run/fal-ai/moondream2/visual-query","tagline":"Moondream2 is a highly efficient open-source vision language model that combines powerful image understanding capabilities with a remarkably small footprint.","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/moondream2","name":"Moondream2","created_by":"fal","source":"official","description":"Moondream2 is a highly efficient open-source vision language model that combines powerful image understanding capabilities with a remarkably small 
footprint.","status":"active","release_date":"2025-04-26","model_type":"other","page_url":"https://fal.run/fal-ai/moondream2","tagline":"Moondream2 is a highly efficient open-source vision language model that combines powerful image understanding capabilities with a remarkably small footprint.","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/moondream3-preview/caption","name":"Moondream3 Preview [Caption]","created_by":"fal","source":"official","description":"Moondream 3 is a vision language model that brings frontier-level visual reasoning with native object detection, pointing, and OCR capabilities to real-world applications requiring fast, inexpensive i","status":"active","release_date":"2025-10-09","model_type":"other","page_url":"https://fal.run/fal-ai/moondream3-preview/caption","tagline":"Moondream 3 is a vision language model that brings frontier-level visual reasoning with native object detection, pointing, and OCR capabilities to real-world applications requiring fast, inexpensive i","capabilities":{"vision":true,"reasoning":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/moondream3-preview/detect","name":"Moondream3 Preview [Detect]","created_by":"fal","source":"official","description":"Moondream 3 is a vision language model that brings frontier-level visual reasoning with native object detection, pointing, and OCR capabilities to real-world applications requiring fast, inexpensive i","status":"active","release_date":"2025-10-09","model_type":"other","page_url":"https://fal.run/fal-ai/moondream3-preview/detect","tagline":"Moondream 3 is a vision language model that brings frontier-level visual reasoning with native object detection, pointing, and OCR capabilities to real-world applications requiring fast, inexpensive 
i","capabilities":{"vision":true,"reasoning":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/moondream3-preview/point","name":"Moondream3 Preview [Point]","created_by":"fal","source":"official","description":"Moondream 3 is a vision language model that brings frontier-level visual reasoning with native object detection, pointing, and OCR capabilities to real-world applications requiring fast, inexpensive i","status":"active","release_date":"2025-10-09","model_type":"other","page_url":"https://fal.run/fal-ai/moondream3-preview/point","tagline":"Moondream 3 is a vision language model that brings frontier-level visual reasoning with native object detection, pointing, and OCR capabilities to real-world applications requiring fast, inexpensive i","capabilities":{"vision":true,"reasoning":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/moondream3-preview/query","name":"Moondream 3 Preview [Query]","created_by":"fal","source":"official","description":"Moondream 3 is a vision language model that brings frontier-level visual reasoning with native object detection, pointing, and OCR capabilities to real-world applications requiring fast, inexpensive i","status":"active","release_date":"2025-10-09","model_type":"other","page_url":"https://fal.run/fal-ai/moondream3-preview/query","tagline":"Moondream 3 is a vision language model that brings frontier-level visual reasoning with native object detection, pointing, and OCR capabilities to real-world applications requiring fast, inexpensive i","capabilities":{"vision":true,"reasoning":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/moondream3-preview/segment","name":"Moondream3 Preview [Segment]","created_by":"fal","source":"official","description":"Moondream 3 is a vision language model that brings frontier-level visual reasoning with native object detection, pointing, and OCR capabilities to real-world applications requiring fast, inexpensive 
inference at scale.","status":"active","release_date":"2025-12-12","model_type":"image","page_url":"https://fal.run/fal-ai/moondream3-preview/segment","tagline":"Moondream 3 is a vision language model that brings frontier-level visual reasoning with native object detection, pointing, and OCR capabilities to real-world applications requiring fast, inexpensive i","capabilities":{"vision":true,"reasoning":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/multishot-master","name":"Multishot Master","created_by":"fal","source":"official","description":"MultiShotMaster is a controllable multi-shot narrative video generation framework that supports text-driven inter-shot consistency, variable shot counts and shot durations, customized subject with mot","status":"active","release_date":"2026-02-24","model_type":"video","page_url":"https://fal.run/fal-ai/multishot-master","tagline":"MultiShotMaster is a controllable multi-shot narrative video generation framework that supports text-driven inter-shot consistency, variable shot counts and shot durations, customized subject with mot","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/musetalk","name":"MuseTalk","created_by":"fal","source":"official","description":"MuseTalk is a real-time high quality audio-driven lip-syncing model.","status":"active","release_date":"2024-04-11","model_type":"video","page_url":"https://fal.run/fal-ai/musetalk","tagline":"MuseTalk is a real-time high quality audio-driven lip-syncing model.","capabilities":{"vision":true},"modalities":{"input":["text","image","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/nafnet/deblur","name":"NAFNet-deblur","created_by":"fal","source":"official","description":"Use NAFNet to fix issues like 
blurriness and noise in your images.","status":"active","release_date":"2025-02-21","model_type":"image","page_url":"https://fal.run/fal-ai/nafnet/deblur","tagline":"Use NAFNet to fix issues like blurriness and noise in your images.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/nafnet/denoise","name":"NAFNet-denoise","created_by":"fal","source":"official","description":"Use NAFNet to fix issues like blurriness and noise in your images.","status":"active","release_date":"2025-02-21","model_type":"image","page_url":"https://fal.run/fal-ai/nafnet/denoise","tagline":"Use NAFNet to fix issues like blurriness and noise in your images.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/nano-banana-2/edit","name":"Nano Banana 2","created_by":"fal","source":"official","description":"Nano Banana 2 is Google's new state-of-the-art image generation and editing model\n","status":"active","release_date":"2026-02-26","model_type":"image","page_url":"https://fal.run/fal-ai/nano-banana-2/edit","tagline":"Nano Banana 2 is Google's new state-of-the-art image generation and editing model\n","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-28","last_updated":"2026-05-11"},{"id":"fal-ai/nano-banana-2","name":"Nano Banana 2","created_by":"fal","source":"official","description":"Nano Banana 2 is Google's new state-of-the-art fast image generation and editing model","status":"active","release_date":"2026-02-26","model_type":"image","page_url":"https://fal.run/fal-ai/nano-banana-2","tagline":"Nano Banana 2 is Google's new state-of-the-art fast image generation and editing 
model","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-11","last_updated":"2026-06-18"},{"id":"fal-ai/nano-banana/edit","name":"Nano Banana","created_by":"fal","source":"official","description":"Google's famous original image generation and editing model","status":"active","release_date":"2025-08-19","model_type":"image","page_url":"https://fal.run/fal-ai/nano-banana/edit","tagline":"Google's famous original image generation and editing model","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-26","last_updated":"2026-06-29"},{"id":"fal-ai/nano-banana-pro/edit","name":"Nano Banana Pro","created_by":"fal","source":"official","description":"Nano Banana Pro is Google's new state-of-the-art image generation and editing model","status":"active","release_date":"2025-11-20","model_type":"image","page_url":"https://fal.run/fal-ai/nano-banana-pro/edit","tagline":"Nano Banana Pro is Google's new state-of-the-art image generation and editing model","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-18","last_updated":"2026-06-20"},{"id":"fal-ai/nano-banana-pro","name":"Nano Banana Pro","created_by":"fal","source":"official","description":"Nano Banana Pro is Google's new state-of-the-art image generation and editing model","status":"active","release_date":"2025-11-20","model_type":"image","page_url":"https://fal.run/fal-ai/nano-banana-pro","tagline":"Nano Banana Pro is Google's new state-of-the-art image generation and editing model","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-28","last_updated":"2026-05-11"},{"id":"fal-ai/nano-banana","name":"Nano Banana","created_by":"fal","source":"official","description":"Google's famous original image 
generation and editing model","status":"active","release_date":"2025-08-19","model_type":"image","page_url":"https://fal.run/fal-ai/nano-banana","tagline":"Google's famous original image generation and editing model","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/nemotron-diffusion-vlm","name":"Nemotron Diffusion Vlm","created_by":"fal","source":"official","description":"Nemotron-Labs-Diffusion-VLM-8B is the vision-language extension of the Nemotron-Labs-Diffusion family.","status":"active","release_date":"2026-05-21","model_type":"other","page_url":"https://fal.run/fal-ai/nemotron-diffusion-vlm","tagline":"Nemotron-Labs-Diffusion-VLM-8B is the vision-language extension of the Nemotron-Labs-Diffusion family.","capabilities":{"vision":true},"last_seen_at":"2026-05-21","last_updated":"2026-06-03"},{"id":"fal-ai/nextstep-1","name":"Nextstep 1","created_by":"fal","source":"official","description":"Endpoint for NextStep-1 Autoregressive Image Editing model.","status":"active","release_date":"2025-08-19","model_type":"image","page_url":"https://fal.run/fal-ai/nextstep-1","tagline":"Endpoint for NextStep-1 Autoregressive Image Editing model.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/nova-sr","name":"Nova SR","created_by":"fal","source":"official","description":"Enhance muffled 16 kHz speech audio into crystal-clear 48 kHz","status":"active","release_date":"2026-01-13","model_type":"other","page_url":"https://fal.run/fal-ai/nova-sr","tagline":"Enhance muffled 16 kHz speech audio into crystal-clear 48 kHz","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/nucleus-image","name":"Nucleus Image","created_by":"fal","source":"official","description":"Nucleus-Image is a text-to-image 
generation model built on a sparse mixture-of-experts (MoE) diffusion transformer architecture.","status":"active","release_date":"2026-04-16","model_type":"image","page_url":"https://fal.run/fal-ai/nucleus-image","tagline":"Nucleus-Image is a text-to-image generation model built on a sparse mixture-of-experts (MoE) diffusion transformer architecture.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-28","last_updated":"2026-05-11"},{"id":"fal-ai/object-removal/bbox","name":"Object Removal","created_by":"fal","source":"official","description":"Removes box-selected objects and their visual effects, seamlessly reconstructing the scene with contextually appropriate content.","status":"active","release_date":"2025-06-16","model_type":"image","page_url":"https://fal.run/fal-ai/object-removal/bbox","tagline":"Removes box-selected objects and their visual effects, seamlessly reconstructing the scene with contextually appropriate content.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/object-removal/mask","name":"Object Removal","created_by":"fal","source":"official","description":"Removes mask-selected objects and their visual effects, seamlessly reconstructing the scene with contextually appropriate content.","status":"active","release_date":"2025-06-16","model_type":"image","page_url":"https://fal.run/fal-ai/object-removal/mask","tagline":"Removes mask-selected objects and their visual effects, seamlessly reconstructing the scene with contextually appropriate content.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/object-removal","name":"Object Removal","created_by":"fal","source":"official","description":"Removes 
objects and their visual effects using natural language, replacing them with contextually appropriate content","status":"active","release_date":"2025-06-16","model_type":"image","page_url":"https://fal.run/fal-ai/object-removal","tagline":"Removes objects and their visual effects using natural language, replacing them with contextually appropriate content","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/omni-zero","name":"Omni Zero","created_by":"fal","source":"official","description":"Any pose, any style, any identity","status":"active","release_date":"2024-04-25","model_type":"image","page_url":"https://fal.run/fal-ai/omni-zero","tagline":"Any pose, any style, any identity","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/omnigen-v1","name":"OmniGen v1","created_by":"fal","source":"official","description":"OmniGen is a unified image generation model that can generate a wide range of images from multi-modal prompts.","status":"active","release_date":"2024-11-29","model_type":"image","page_url":"https://fal.run/fal-ai/omnigen-v1","tagline":"OmniGen is a unified image generation model that can generate a wide range of images from multi-modal prompts.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/omnigen-v2","name":"Omnigen V2","created_by":"fal","source":"official","description":"OmniGen is a unified image generation model that can generate a wide range of images from multi-modal prompts.","status":"active","release_date":"2025-06-25","model_type":"image","page_url":"https://fal.run/fal-ai/omnigen-v2","tagline":"OmniGen is a unified image generation model that can 
generate a wide range of images from multi-modal prompts.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/omnilottie/image-to-lottie","name":"Omnilottie","created_by":"fal","source":"official","description":"Convert your assets into lottie using Omnilottie.","status":"active","release_date":"2026-03-11","model_type":"other","page_url":"https://fal.run/fal-ai/omnilottie/image-to-lottie","tagline":"Convert your assets into lottie using Omnilottie.","capabilities":{"vision":true,"structured_output":true,"json_mode":true},"last_seen_at":"2026-03-17","last_updated":"2026-05-11"},{"id":"fal-ai/omnilottie/video-to-lottie","name":"Omnilottie","created_by":"fal","source":"official","description":"Convert your assets into lottie using Omnilottie.","status":"active","release_date":"2026-03-11","model_type":"other","page_url":"https://fal.run/fal-ai/omnilottie/video-to-lottie","tagline":"Convert your assets into lottie using Omnilottie.","capabilities":{"structured_output":true,"json_mode":true},"last_seen_at":"2026-03-17","last_updated":"2026-05-11"},{"id":"fal-ai/omnilottie","name":"Omnilottie","created_by":"fal","source":"official","description":"Convert your assets into lottie using Omnilottie.","status":"active","release_date":"2026-03-11","model_type":"other","page_url":"https://fal.run/fal-ai/omnilottie","tagline":"Convert your assets into lottie using Omnilottie.","capabilities":{"structured_output":true,"json_mode":true},"last_seen_at":"2026-03-17","last_updated":"2026-05-11"},{"id":"fal-ai/omnipart","name":"Omnipart","created_by":"fal","source":"official","description":"Image-to-3D endpoint for OmniPart, a part-aware 3D generator with semantic decoupling and structural cohesion.","status":"active","release_date":"2025-10-29","model_type":"other","page_url":"https://fal.run/fal-ai/omnipart","tagline":"Image-to-3D endpoint for OmniPart, a 
part-aware 3D generator with semantic decoupling and structural cohesion.","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/one-to-all-animation/1.3b","name":"One To All Animation","created_by":"fal","source":"official","description":"One-to-All Animation is a pose driven video model that animates characters from a single reference image, enabling flexible, alignment-free motion transfer across diverse styles and scenes","status":"active","release_date":"2025-12-11","model_type":"other","page_url":"https://fal.run/fal-ai/one-to-all-animation/1.3b","tagline":"One-to-All Animation is a pose driven video model that animates characters from a single reference image, enabling flexible, alignment-free motion transfer across diverse styles and scenes","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/one-to-all-animation/14b","name":"One To All Animation","created_by":"fal","source":"official","description":"One-to-All Animation is a pose driven video model that animates characters from a single reference image, enabling flexible, alignment-free motion transfer across diverse styles and scenes","status":"active","release_date":"2025-12-11","model_type":"other","page_url":"https://fal.run/fal-ai/one-to-all-animation/14b","tagline":"One-to-All Animation is a pose driven video model that animates characters from a single reference image, enabling flexible, alignment-free motion transfer across diverse styles and scenes","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/onereward","name":"Onereward","created_by":"fal","source":"official","description":"OneReward is a finetuned version of Flux 1.0 Fill with intelligent editing capabilities.","status":"active","release_date":"2026-03-05","model_type":"image","page_url":"https://fal.run/fal-ai/onereward","tagline":"OneReward is a finetuned version of Flux 1.0 Fill with 
intelligent editing capabilities.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-03-05","last_updated":"2026-05-11"},{"id":"fal-ai/orpheus-tts","name":"Orpheus TTS","created_by":"fal","source":"official","description":"Orpheus TTS is a state-of-the-art, Llama-based Speech-LLM designed for high-quality, empathetic text-to-speech generation.","status":"active","release_date":"2025-03-31","model_type":"tts","page_url":"https://fal.run/fal-ai/orpheus-tts","tagline":"Orpheus TTS is a state-of-the-art, Llama-based Speech-LLM designed for high-quality, empathetic text-to-speech generation.","modalities":{"input":["text"],"output":["audio"]},"endpoints":["audio_speech"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/ovi/image-to-video","name":"Ovi","created_by":"fal","source":"official","description":"Ovi can generate videos with audio from image and text inputs.","status":"active","release_date":"2025-10-03","model_type":"video","page_url":"https://fal.run/fal-ai/ovi/image-to-video","tagline":"Ovi can generate videos with audio from image and text inputs.","capabilities":{"vision":true},"modalities":{"input":["text","image","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/ovi","name":"Ovi Text to Video","created_by":"fal","source":"official","description":"A unified paradigm for audio-video generation","status":"active","release_date":"2025-10-03","model_type":"video","page_url":"https://fal.run/fal-ai/ovi","tagline":"A unified paradigm for audio-video generation","modalities":{"input":["text","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/ovis-image","name":"Ovis Image","created_by":"fal","source":"official","description":"Ovis-Image is a 7B text-to-image model specifically optimized for quick, high quality text 
rendering.","status":"active","release_date":"2025-11-29","model_type":"image","page_url":"https://fal.run/fal-ai/ovis-image","tagline":"Ovis-Image is a 7B text-to-image model specifically optimized for quick, high quality text rendering.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/pasd","name":"PASD","created_by":"fal","source":"official","description":"Pixel-Aware Diffusion Model for Realistic Image Super-Resolution and Personalized Stylization","status":"active","release_date":"2025-06-17","model_type":"image","page_url":"https://fal.run/fal-ai/pasd","tagline":"Pixel-Aware Diffusion Model for Realistic Image Super-Resolution and Personalized Stylization","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/patina/material/extract","name":"PATINA","created_by":"fal","source":"official","description":"Extract seamless tiling textures with PBR attribute maps from images","status":"active","release_date":"2026-04-08","model_type":"image","page_url":"https://fal.run/fal-ai/patina/material/extract","tagline":"Extract seamless tiling textures with PBR attribute maps from images","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/patina/material","name":"PATINA","created_by":"fal","source":"official","description":"Generate complete seamlessly tiling PBR materials including normal, roughness, basecolor, height and metalness maps up to 8K","status":"active","release_date":"2026-04-08","model_type":"image","page_url":"https://fal.run/fal-ai/patina/material","tagline":"Generate complete seamlessly tiling PBR materials including normal, roughness, basecolor, height and metalness maps 
up to 8K","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/patina","name":"PATINA","created_by":"fal","source":"official","description":"PATINA creates seamless high-resolution normal, roughness, basecolor (albedo), height (displacement) and metalness maps from images","status":"active","release_date":"2026-04-08","model_type":"image","page_url":"https://fal.run/fal-ai/patina","tagline":"PATINA creates seamless high-resolution normal, roughness, basecolor (albedo), height (displacement) and metalness maps from images","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/personaplex/realtime","name":"Personaplex","created_by":"fal","source":"official","description":"PersonaPlex is a real-time, full-duplex speech-to-speech conversational model that enables persona control through text-based role prompts and audio-based voice conditioning.","status":"active","release_date":"2026-02-20","model_type":"other","page_url":"https://fal.run/fal-ai/personaplex/realtime","tagline":"PersonaPlex is a real-time, full-duplex speech-to-speech conversational model that enables persona control through text-based role prompts and audio-based voice conditioning.","last_seen_at":"2026-06-15","last_updated":"2026-06-18"},{"id":"fal-ai/personaplex","name":"Personaplex","created_by":"fal","source":"official","description":"PersonaPlex is a real-time, full-duplex speech-to-speech conversational model that enables persona control through text-based role prompts and audio-based voice conditioning.","status":"active","release_date":"2026-02-12","model_type":"other","page_url":"https://fal.run/fal-ai/personaplex","tagline":"PersonaPlex is a real-time, full-duplex speech-to-speech conversational model that enables persona control through 
text-based role prompts and audio-based voice conditioning.","capabilities":{"streaming":true},"last_seen_at":"2026-06-15","last_updated":"2026-06-18"},{"id":"fal-ai/phota/create-profile","name":"Phota Create Profile","created_by":"fal","source":"official","description":"Generate profiles using 30-50 images of a subject with Phota.","status":"active","release_date":"2026-03-26","model_type":"other","page_url":"https://fal.run/fal-ai/phota/create-profile","tagline":"Generate profiles using 30-50 images of a subject with Phota.","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/phota/edit","name":"Phota","created_by":"fal","source":"official","description":"Phota's model enables personalized photo editing, preserving identity while erasing distractions seamlessly.","status":"active","release_date":"2026-03-26","model_type":"image","page_url":"https://fal.run/fal-ai/phota/edit","tagline":"Phota's model enables personalized photo editing, preserving identity while erasing distractions seamlessly.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-05-27","last_updated":"2026-06-03"},{"id":"fal-ai/phota/enhance","name":"Phota Enhance","created_by":"fal","source":"official","description":"Enhance images while preserving identities with Phota","status":"active","release_date":"2026-03-26","model_type":"image","page_url":"https://fal.run/fal-ai/phota/enhance","tagline":"Enhance images while preserving identities with Phota","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-05-27","last_updated":"2026-06-03"},{"id":"fal-ai/phota","name":"Phota Text to Image","created_by":"fal","source":"official","description":"Phota's model empowers developers, photographers, and creators with personalized photograph generation and 
editing.","status":"active","release_date":"2026-03-26","model_type":"image","page_url":"https://fal.run/fal-ai/phota","tagline":"Phota's model empowers developers, photographers, and creators with personalized photograph generation and editing.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-05-27","last_updated":"2026-06-03"},{"id":"fal-ai/photomaker","name":"PhotoMaker","created_by":"fal","source":"official","description":"Customizing Realistic Human Photos via Stacked ID Embedding","status":"active","release_date":"2024-03-08","model_type":"image","page_url":"https://fal.run/fal-ai/photomaker","tagline":"Customizing Realistic Human Photos via Stacked ID Embedding","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/physic-edit","name":"Physic Edit","created_by":"fal","source":"official","description":"Physics-aware image editing with PhysicEdit.","status":"active","release_date":"2026-03-12","model_type":"image","page_url":"https://fal.run/fal-ai/physic-edit","tagline":"Physics-aware image editing with PhysicEdit.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-03-12","last_updated":"2026-05-11"},{"id":"fal-ai/piflow","name":"Piflow","created_by":"fal","source":"official","description":"Use the faster speed of piflow to generate images with same quality to that of slower models.","status":"active","release_date":"2025-10-27","model_type":"image","page_url":"https://fal.run/fal-ai/piflow","tagline":"Use the faster speed of piflow to generate images with same quality to that of slower 
models.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/pika/v1.5/pikaffects","name":"Pika Effects (v1.5)","created_by":"fal","source":"official","description":"Pika Effects are AI-powered video effects designed to modify objects, characters, and environments in a fun, engaging, and visually compelling manner.","status":"active","release_date":"2025-03-14","model_type":"video","page_url":"https://fal.run/fal-ai/pika/v1.5/pikaffects","tagline":"Pika Effects are AI-powered video effects designed to modify objects, characters, and environments in a fun, engaging, and visually compelling manner.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/pika/v2/pikadditions","name":"Pikadditions (v2)","created_by":"fal","source":"official","description":"Pikadditions is a powerful video-to-video AI model that allows you to add anyone or anything to any video with seamless integration.","status":"active","release_date":"2025-03-14","model_type":"other","page_url":"https://fal.run/fal-ai/pika/v2/pikadditions","tagline":"Pikadditions is a powerful video-to-video AI model that allows you to add anyone or anything to any video with seamless integration.","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/pika/v2/turbo/image-to-video","name":"Pika Image to Video Turbo (v2)","created_by":"fal","source":"official","description":"Turbo is the model to use when you feel the need for speed.","status":"active","release_date":"2025-03-14","model_type":"video","page_url":"https://fal.run/fal-ai/pika/v2/turbo/image-to-video","tagline":"Turbo is the model to use when you feel the need for 
speed.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/pika/v2/turbo/text-to-video","name":"Pika Text to Video Turbo (v2)","created_by":"fal","source":"official","description":"Pika v2 Turbo creates videos from a text prompt with high quality output.","status":"active","release_date":"2025-03-14","model_type":"video","page_url":"https://fal.run/fal-ai/pika/v2/turbo/text-to-video","tagline":"Pika v2 Turbo creates videos from a text prompt with high quality output.","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/pika/v2.1/image-to-video","name":"Pika Image to Video (v2.1)","created_by":"fal","source":"official","description":"Turn photos into mind-blowing, dynamic videos.","status":"active","release_date":"2025-03-14","model_type":"video","page_url":"https://fal.run/fal-ai/pika/v2.1/image-to-video","tagline":"Turn photos into mind-blowing, dynamic videos.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/pika/v2.1/text-to-video","name":"Pika Text to Video (v2.1)","created_by":"fal","source":"official","description":"Start with a simple text input to create dynamic generations that defy expectations.","status":"active","release_date":"2025-03-14","model_type":"video","page_url":"https://fal.run/fal-ai/pika/v2.1/text-to-video","tagline":"Start with a simple text input to create dynamic generations that defy expectations.","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/pika/v2.2/image-to-video","name":"Pika Image to Video (v2.2)","created_by":"fal","source":"official","description":"Turn photos into mind-blowing, 
dynamic videos in up to 1080p.","status":"active","release_date":"2025-03-14","model_type":"video","page_url":"https://fal.run/fal-ai/pika/v2.2/image-to-video","tagline":"Turn photos into mind-blowing, dynamic videos in up to 1080p.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/pika/v2.2/pikaframes","name":"Pika","created_by":"fal","source":"official","description":"Discover ultimate control with Pikaframes key frame interpolation, a stunning image-to-video feature that allows you to upload up to 5 keyframes, customize their transition length and prompt, and see ","status":"active","release_date":"2025-11-07","model_type":"video","page_url":"https://fal.run/fal-ai/pika/v2.2/pikaframes","tagline":"Discover ultimate control with Pikaframes key frame interpolation, a stunning image-to-video feature that allows you to upload up to 5 keyframes, customize their transition length and prompt, and see ","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/pika/v2.2/pikascenes","name":"Pika Scenes (v2.2)","created_by":"fal","source":"official","description":"Pika Scenes v2.2 creates videos from a images with high quality output.","status":"active","release_date":"2025-03-14","model_type":"video","page_url":"https://fal.run/fal-ai/pika/v2.2/pikascenes","tagline":"Pika Scenes v2.2 creates videos from a images with high quality output.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/pika/v2.2/text-to-video","name":"Pika Text to Video (v2.2)","created_by":"fal","source":"official","description":"Start with a simple text input to create dynamic generations that defy expectations in 
up to 1080p.","status":"active","release_date":"2025-03-14","model_type":"video","page_url":"https://fal.run/fal-ai/pika/v2.2/text-to-video","tagline":"Start with a simple text input to create dynamic generations that defy expectations in up to 1080p.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/pixal3d","name":"Pixal3d","created_by":"fal","source":"official","description":"Pixal3D turns a single image into a high-fidelity 3D model with detailed geometry and realistic textures.","status":"active","release_date":"2026-05-13","model_type":"other","page_url":"https://fal.run/fal-ai/pixal3d","tagline":"Pixal3D turns a single image into a high-fidelity 3D model with detailed geometry and realistic textures.","capabilities":{"vision":true},"last_seen_at":"2026-05-22","last_updated":"2026-06-03"},{"id":"fal-ai/pixart-sigma","name":"PixArt-Σ","created_by":"fal","source":"official","description":"Weak-to-Strong Training of Diffusion Transformer for 4K Text-to-Image Generation","status":"active","release_date":"2024-08-01","model_type":"image","page_url":"https://fal.run/fal-ai/pixart-sigma","tagline":"Weak-to-Strong Training of Diffusion Transformer for 4K Text-to-Image Generation","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/pixverse/c1/image-to-video","name":"PixVerse C1 Image To Video","created_by":"fal","source":"official","description":"Animate images into cinematic videos with PixVerse C1, supporting 1080p resolution and native audio generation.","status":"active","release_date":"2026-04-08","model_type":"video","page_url":"https://fal.run/fal-ai/pixverse/c1/image-to-video","tagline":"Animate images into cinematic videos with PixVerse C1, supporting 1080p resolution and native audio 
generation.","capabilities":{"vision":true},"modalities":{"input":["text","image","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-17","last_updated":"2026-06-18"},{"id":"fal-ai/pixverse/c1/reference-to-video","name":"PixVerse C1 Reference To Video","created_by":"fal","source":"official","description":"Generate character-consistent videos from reference images using PixVerse C1, with subject and background references.","status":"active","release_date":"2026-04-08","model_type":"video","page_url":"https://fal.run/fal-ai/pixverse/c1/reference-to-video","tagline":"Generate character-consistent videos from reference images using PixVerse C1, with subject and background references.","capabilities":{"vision":true},"modalities":{"input":["text","image","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-17","last_updated":"2026-06-18"},{"id":"fal-ai/pixverse/c1/text-to-video","name":"PixVerse C1 Text To Video","created_by":"fal","source":"official","description":"Generate film-grade videos from text prompts with native audio, up to 1080p and 15 seconds, using PixVerse C1.","status":"active","release_date":"2026-04-08","model_type":"video","page_url":"https://fal.run/fal-ai/pixverse/c1/text-to-video","tagline":"Generate film-grade videos from text prompts with native audio, up to 1080p and 15 seconds, using PixVerse C1.","modalities":{"input":["text","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-17","last_updated":"2026-06-18"},{"id":"fal-ai/pixverse/c1/transition","name":"PixVerse C1 Transition","created_by":"fal","source":"official","description":"Create seamless cinematic transitions between two images with PixVerse C1, with native audio and up to 1080p.","status":"active","release_date":"2026-04-08","model_type":"video","page_url":"https://fal.run/fal-ai/pixverse/c1/transition","tagline":"Create seamless cinematic transitions between two images with PixVerse C1, with native audio and up to 
1080p.","capabilities":{"vision":true},"modalities":{"input":["text","image","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-17","last_updated":"2026-06-18"},{"id":"fal-ai/pixverse/extend/fast","name":"PixVerse Extend Fast","created_by":"fal","source":"official","description":"PixVerse Extend model is a video extending tool for your videos using with high-quality video extending techniques ","status":"active","release_date":"2025-06-30","model_type":"other","page_url":"https://fal.run/fal-ai/pixverse/extend/fast","tagline":"PixVerse Extend model is a video extending tool for your videos using with high-quality video extending techniques ","capabilities":{"tool_call":true},"tools":["function_calling"],"last_seen_at":"2026-06-17","last_updated":"2026-06-18"},{"id":"fal-ai/pixverse/extend","name":"PixVerse Extend","created_by":"fal","source":"official","description":"PixVerse Extend model is a video extending tool for your videos using with high-quality video extending techniques ","status":"active","release_date":"2025-06-30","model_type":"other","page_url":"https://fal.run/fal-ai/pixverse/extend","tagline":"PixVerse Extend model is a video extending tool for your videos using with high-quality video extending techniques ","capabilities":{"tool_call":true},"tools":["function_calling"],"last_seen_at":"2026-06-17","last_updated":"2026-06-18"},{"id":"fal-ai/pixverse/lipsync","name":"PixVerse Lipsync","created_by":"fal","source":"official","description":"Generate realistic lipsync animations from audio using advanced algorithms for high-quality synchronization with PixVerse Lipsync model","status":"active","release_date":"2025-06-30","model_type":"other","page_url":"https://fal.run/fal-ai/pixverse/lipsync","tagline":"Generate realistic lipsync animations from audio using advanced algorithms for high-quality synchronization with PixVerse Lipsync 
model","last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/pixverse/sound-effects","name":"PixVerse Sound Effects","created_by":"fal","source":"official","description":"Add immersive sound effects and background music to your videos using PixVerse sound effects generation","status":"active","release_date":"2025-07-07","model_type":"other","page_url":"https://fal.run/fal-ai/pixverse/sound-effects","tagline":"Add immersive sound effects and background music to your videos using PixVerse sound effects generation","last_seen_at":"2026-06-17","last_updated":"2026-06-18"},{"id":"fal-ai/pixverse/swap","name":"PixVerse Swap","created_by":"fal","source":"official","description":"Generate high quality video clips by swapping person, objects and background using Pixverse Swap.","status":"active","release_date":"2025-11-10","model_type":"video","page_url":"https://fal.run/fal-ai/pixverse/swap","tagline":"Generate high quality video clips by swapping person, objects and background using Pixverse Swap.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-17","last_updated":"2026-06-18"},{"id":"fal-ai/pixverse/v3.5/effects","name":"PixVerse V3.5 Effects","created_by":"fal","source":"official","description":"Generate high quality video clips with different effects using PixVerse v3.5","status":"active","release_date":"2025-04-01","model_type":"video","page_url":"https://fal.run/fal-ai/pixverse/v3.5/effects","tagline":"Generate high quality video clips with different effects using PixVerse v3.5","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-17","last_updated":"2026-06-18"},{"id":"fal-ai/pixverse/v3.5/image-to-video/fast","name":"PixVerse V3.5 Image To Video Fast","created_by":"fal","source":"official","description":"Generate high quality video clips from text and image prompts quickly using 
PixVerse v3.5 Fast","status":"active","release_date":"2025-01-29","model_type":"video","page_url":"https://fal.run/fal-ai/pixverse/v3.5/image-to-video/fast","tagline":"Generate high quality video clips from text and image prompts quickly using PixVerse v3.5 Fast","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-17","last_updated":"2026-06-18"},{"id":"fal-ai/pixverse/v3.5/image-to-video","name":"PixVerse V3.5 Image To Video","created_by":"fal","source":"official","description":"Generate high quality video clips from text and image prompts using PixVerse v3.5","status":"active","release_date":"2025-01-29","model_type":"video","page_url":"https://fal.run/fal-ai/pixverse/v3.5/image-to-video","tagline":"Generate high quality video clips from text and image prompts using PixVerse v3.5","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-17","last_updated":"2026-06-18"},{"id":"fal-ai/pixverse/v3.5/text-to-video/fast","name":"PixVerse V3.5 Text To Video Fast","created_by":"fal","source":"official","description":"Generate high quality video clips quickly from text prompts using PixVerse v3.5 Fast","status":"active","release_date":"2025-01-29","model_type":"video","page_url":"https://fal.run/fal-ai/pixverse/v3.5/text-to-video/fast","tagline":"Generate high quality video clips quickly from text prompts using PixVerse v3.5 Fast","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-17","last_updated":"2026-06-18"},{"id":"fal-ai/pixverse/v3.5/text-to-video","name":"PixVerse V3.5 Text To Video","created_by":"fal","source":"official","description":"Generate high quality video clips from text prompts using PixVerse v3.5","status":"active","release_date":"2025-01-29","model_type":"video","page_url":"https://fal.run/fal-ai/pixverse/v3.5/text-to-video","tagline":"Generate 
high quality video clips from text prompts using PixVerse v3.5","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-17","last_updated":"2026-06-18"},{"id":"fal-ai/pixverse/v3.5/transition","name":"PixVerse V3.5 Transition","created_by":"fal","source":"official","description":"Create seamless transition between images using PixVerse v3.5","status":"active","release_date":"2025-04-01","model_type":"video","page_url":"https://fal.run/fal-ai/pixverse/v3.5/transition","tagline":"Create seamless transition between images using PixVerse v3.5","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-17","last_updated":"2026-06-18"},{"id":"fal-ai/pixverse/v4/effects","name":"PixVerse V4 Effects","created_by":"fal","source":"official","description":"Generate high quality video clips with different effects using PixVerse v4","status":"active","release_date":"2025-04-23","model_type":"video","page_url":"https://fal.run/fal-ai/pixverse/v4/effects","tagline":"Generate high quality video clips with different effects using PixVerse v4","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-17","last_updated":"2026-06-18"},{"id":"fal-ai/pixverse/v4/image-to-video/fast","name":"PixVerse V4 Image To Video Fast","created_by":"fal","source":"official","description":"Generate fast high quality video clips from text and image prompts using PixVerse v4","status":"active","release_date":"2025-04-01","model_type":"video","page_url":"https://fal.run/fal-ai/pixverse/v4/image-to-video/fast","tagline":"Generate fast high quality video clips from text and image prompts using PixVerse 
v4","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-17","last_updated":"2026-06-18"},{"id":"fal-ai/pixverse/v4/image-to-video","name":"PixVerse V4 Image To Video","created_by":"fal","source":"official","description":"Generate high quality video clips from text and image prompts using PixVerse v4","status":"active","release_date":"2025-04-01","model_type":"video","page_url":"https://fal.run/fal-ai/pixverse/v4/image-to-video","tagline":"Generate high quality video clips from text and image prompts using PixVerse v4","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-17","last_updated":"2026-06-18"},{"id":"fal-ai/pixverse/v4/text-to-video/fast","name":"PixVerse V4 Text To Video Fast","created_by":"fal","source":"official","description":"Generate high quality and fast video clips from text and image prompts using PixVerse v4 fast","status":"active","release_date":"2025-04-01","model_type":"video","page_url":"https://fal.run/fal-ai/pixverse/v4/text-to-video/fast","tagline":"Generate high quality and fast video clips from text and image prompts using PixVerse v4 fast","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-17","last_updated":"2026-06-18"},{"id":"fal-ai/pixverse/v4/text-to-video","name":"PixVerse V4 Text To Video","created_by":"fal","source":"official","description":"Generate high quality video clips from text and image prompts using PixVerse v4","status":"active","release_date":"2025-04-01","model_type":"video","page_url":"https://fal.run/fal-ai/pixverse/v4/text-to-video","tagline":"Generate high quality video clips from text and image prompts using PixVerse 
v4","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-17","last_updated":"2026-06-18"},{"id":"fal-ai/pixverse/v4.5/effects","name":"PixVerse V4.5 Effects","created_by":"fal","source":"official","description":"Generate high quality video clips with different effects using PixVerse v4.5","status":"active","release_date":"2025-05-15","model_type":"video","page_url":"https://fal.run/fal-ai/pixverse/v4.5/effects","tagline":"Generate high quality video clips with different effects using PixVerse v4.5","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-17","last_updated":"2026-06-18"},{"id":"fal-ai/pixverse/v4.5/image-to-video/fast","name":"PixVerse V4.5 Image To Video Fast","created_by":"fal","source":"official","description":"Generate fast high quality video clips from text and image prompts using PixVerse v4.5","status":"active","release_date":"2025-05-15","model_type":"video","page_url":"https://fal.run/fal-ai/pixverse/v4.5/image-to-video/fast","tagline":"Generate fast high quality video clips from text and image prompts using PixVerse v4.5","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-17","last_updated":"2026-06-18"},{"id":"fal-ai/pixverse/v4.5/image-to-video","name":"PixVerse V4.5 Image To Video","created_by":"fal","source":"official","description":"Generate high quality video clips from text and image prompts using PixVerse v4.5","status":"active","release_date":"2025-05-15","model_type":"video","page_url":"https://fal.run/fal-ai/pixverse/v4.5/image-to-video","tagline":"Generate high quality video clips from text and image prompts using PixVerse 
v4.5","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-17","last_updated":"2026-06-18"},{"id":"fal-ai/pixverse/v4.5/text-to-video/fast","name":"PixVerse V4.5 Text To Video Fast","created_by":"fal","source":"official","description":"Generate high quality and fast video clips from text and image prompts using PixVerse v4.5 fast","status":"active","release_date":"2025-05-15","model_type":"video","page_url":"https://fal.run/fal-ai/pixverse/v4.5/text-to-video/fast","tagline":"Generate high quality and fast video clips from text and image prompts using PixVerse v4.5 fast","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-17","last_updated":"2026-06-18"},{"id":"fal-ai/pixverse/v4.5/text-to-video","name":"PixVerse V4.5 Text To Video","created_by":"fal","source":"official","description":"Generate high quality video clips from text and image prompts using PixVerse v4.5","status":"active","release_date":"2025-05-15","model_type":"video","page_url":"https://fal.run/fal-ai/pixverse/v4.5/text-to-video","tagline":"Generate high quality video clips from text and image prompts using PixVerse v4.5","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-17","last_updated":"2026-06-18"},{"id":"fal-ai/pixverse/v4.5/transition","name":"PixVerse V4.5 Transition","created_by":"fal","source":"official","description":"Create seamless transition between images using PixVerse v4.5","status":"active","release_date":"2025-05-15","model_type":"video","page_url":"https://fal.run/fal-ai/pixverse/v4.5/transition","tagline":"Create seamless transition between images using PixVerse 
v4.5","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-17","last_updated":"2026-06-18"},{"id":"fal-ai/pixverse/v5/effects","name":"PixVerse V5 Effects","created_by":"fal","source":"official","description":"Generate high quality video clips with different effects using PixVerse v5","status":"active","release_date":"2025-08-23","model_type":"video","page_url":"https://fal.run/fal-ai/pixverse/v5/effects","tagline":"Generate high quality video clips with different effects using PixVerse v5","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-17","last_updated":"2026-06-18"},{"id":"fal-ai/pixverse/v5/image-to-video","name":"PixVerse V5 Image To Video","created_by":"fal","source":"official","description":"Generate high quality video clips from text and image prompts using PixVerse v5","status":"active","release_date":"2025-08-23","model_type":"video","page_url":"https://fal.run/fal-ai/pixverse/v5/image-to-video","tagline":"Generate high quality video clips from text and image prompts using PixVerse v5","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/pixverse/v5/text-to-video","name":"PixVerse V5 Text To Video","created_by":"fal","source":"official","description":"Generate high quality video clips from text and image prompts using PixVerse v5","status":"active","release_date":"2025-08-23","model_type":"video","page_url":"https://fal.run/fal-ai/pixverse/v5/text-to-video","tagline":"Generate high quality video clips from text and image prompts using PixVerse v5","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-17","last_updated":"2026-06-18"},{"id":"fal-ai/pixverse/v5/transition","name":"PixVerse 
V5 Transition","created_by":"fal","source":"official","description":"Create seamless transition between images using PixVerse v5","status":"active","release_date":"2025-08-23","model_type":"video","page_url":"https://fal.run/fal-ai/pixverse/v5/transition","tagline":"Create seamless transition between images using PixVerse v5","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-17","last_updated":"2026-06-18"},{"id":"fal-ai/pixverse/v5.5/effects","name":"PixVerse V5.5 Effects","created_by":"fal","source":"official","description":"Pixverse Effects","status":"active","release_date":"2025-12-02","model_type":"video","page_url":"https://fal.run/fal-ai/pixverse/v5.5/effects","tagline":"Pixverse Effects","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/pixverse/v5.5/image-to-video","name":"PixVerse V5.5 Image To Video","created_by":"fal","source":"official","description":"Generate high quality video clips from text and image prompts using PixVerse v5.5","status":"active","release_date":"2025-12-01","model_type":"video","page_url":"https://fal.run/fal-ai/pixverse/v5.5/image-to-video","tagline":"Generate high quality video clips from text and image prompts using PixVerse v5.5","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/pixverse/v5.5/text-to-video","name":"PixVerse V5.5 Text To Video","created_by":"fal","source":"official","description":"Generate high quality video clips from text and image prompts using PixVerse v5.5","status":"active","release_date":"2025-12-01","model_type":"video","page_url":"https://fal.run/fal-ai/pixverse/v5.5/text-to-video","tagline":"Generate high quality video clips from text and image prompts 
using PixVerse v5.5","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/pixverse/v5.5/transition","name":"PixVerse V5.5 Transition","created_by":"fal","source":"official","description":"Pixverse Transition","status":"active","release_date":"2025-12-02","model_type":"video","page_url":"https://fal.run/fal-ai/pixverse/v5.5/transition","tagline":"Pixverse Transition","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/pixverse/v5.6/image-to-video","name":"PixVerse V5.6 Image To Video","created_by":"fal","source":"official","description":"Use the latest pixverse v5.6 model to turn your texts and images into amazing videos.","status":"active","release_date":"2026-01-26","model_type":"video","page_url":"https://fal.run/fal-ai/pixverse/v5.6/image-to-video","tagline":"Use the latest pixverse v5.6 model to turn your texts and images into amazing videos.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-17","last_updated":"2026-06-18"},{"id":"fal-ai/pixverse/v5.6/text-to-video","name":"PixVerse V5.6 Text To Video","created_by":"fal","source":"official","description":"Use the latest pixverse v5.6 model to turn your texts into amazing videos.","status":"active","release_date":"2026-01-26","model_type":"video","page_url":"https://fal.run/fal-ai/pixverse/v5.6/text-to-video","tagline":"Use the latest pixverse v5.6 model to turn your texts into amazing videos.","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-17","last_updated":"2026-06-18"},{"id":"fal-ai/pixverse/v5.6/transition","name":"PixVerse V5.6 Transition","created_by":"fal","source":"official","description":"Use the latest pixverse v5.6 
model to turn your texts and images into amazing videos.","status":"active","release_date":"2026-01-26","model_type":"video","page_url":"https://fal.run/fal-ai/pixverse/v5.6/transition","tagline":"Use the latest pixverse v5.6 model to turn your texts and images into amazing videos.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/pixverse/v6/extend","name":"PixVerse V6 Extend","created_by":"fal","source":"official","description":"Pixverse's latest v6 Model.","status":"active","release_date":"2026-03-29","model_type":"other","page_url":"https://fal.run/fal-ai/pixverse/v6/extend","tagline":"Pixverse's latest v6 Model.","last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/pixverse/v6/image-to-video","name":"PixVerse V6 Image To Video","created_by":"fal","source":"official","description":"Pixverse's latest V6 Model","status":"active","release_date":"2026-03-29","model_type":"video","page_url":"https://fal.run/fal-ai/pixverse/v6/image-to-video","tagline":"Pixverse's latest V6 Model","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-17","last_updated":"2026-06-18"},{"id":"fal-ai/pixverse/v6/text-to-video","name":"PixVerse V6 Text To Video","created_by":"fal","source":"official","description":"Pixverse's latest v6 Model.","status":"active","release_date":"2026-03-29","model_type":"video","page_url":"https://fal.run/fal-ai/pixverse/v6/text-to-video","tagline":"Pixverse's latest v6 Model.","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-17","last_updated":"2026-06-18"},{"id":"fal-ai/pixverse/v6/transition","name":"PixVerse V6 Transition","created_by":"fal","source":"official","description":"Pixverse's latest v6 
Model.","status":"active","release_date":"2026-03-29","model_type":"video","page_url":"https://fal.run/fal-ai/pixverse/v6/transition","tagline":"Pixverse's latest v6 Model.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/playground-v25/image-to-image","name":"Playground v2.5","created_by":"fal","source":"official","description":"State-of-the-art open-source model in aesthetic quality","status":"active","release_date":"2024-02-21","model_type":"image","page_url":"https://fal.run/fal-ai/playground-v25/image-to-image","tagline":"State-of-the-art open-source model in aesthetic quality","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/playground-v25/inpainting","name":"Playground v2.5","created_by":"fal","source":"official","description":"State-of-the-art open-source model in aesthetic quality","status":"active","release_date":"2024-02-21","model_type":"image","page_url":"https://fal.run/fal-ai/playground-v25/inpainting","tagline":"State-of-the-art open-source model in aesthetic quality","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/playground-v25","name":"Playground v2.5","created_by":"fal","source":"official","description":"State-of-the-art open-source model in aesthetic quality","status":"active","release_date":"2024-04-25","model_type":"image","page_url":"https://fal.run/fal-ai/playground-v25","tagline":"State-of-the-art open-source model in aesthetic 
quality","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/plushify","name":"Plushify","created_by":"fal","source":"official","description":"Turn any image into a cute plushie!","status":"active","release_date":"2025-04-20","model_type":"image","page_url":"https://fal.run/fal-ai/plushify","tagline":"Turn any image into a cute plushie!","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/pony-v7","name":"Pony V7","created_by":"fal","source":"official","description":"Pony V7 is a finetuned text to image for superior aesthetics and prompt following.","status":"active","release_date":"2025-05-05","model_type":"image","page_url":"https://fal.run/fal-ai/pony-v7","tagline":"Pony V7 is a finetuned text to image for superior aesthetics and prompt following.","capabilities":{"streaming":true,"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/post-processing/blur","name":"Post Processing Blur","created_by":"fal","source":"official","description":"Apply Gaussian or Kuwahara blur effects with adjustable radius and sigma parameters","status":"active","release_date":"2025-07-01","model_type":"image","page_url":"https://fal.run/fal-ai/post-processing/blur","tagline":"Apply Gaussian or Kuwahara blur effects with adjustable radius and sigma parameters","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/post-processing/chromatic-aberration","name":"Post Processing Chromatic Aberration","created_by":"fal","source":"official","description":"Create chromatic aberration by shifting red, green, and 
blue channels horizontally or vertically with customizable shift amounts.","status":"active","release_date":"2025-07-01","model_type":"image","page_url":"https://fal.run/fal-ai/post-processing/chromatic-aberration","tagline":"Create chromatic aberration by shifting red, green, and blue channels horizontally or vertically with customizable shift amounts.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/post-processing/color-correction","name":"Post Processing Color Correction","created_by":"fal","source":"official","description":"Adjust color temperature, brightness, contrast, saturation, and gamma values for color correction.","status":"active","release_date":"2025-07-01","model_type":"image","page_url":"https://fal.run/fal-ai/post-processing/color-correction","tagline":"Adjust color temperature, brightness, contrast, saturation, and gamma values for color correction.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/post-processing/color-tint","name":"Post Processing Color Tint","created_by":"fal","source":"official","description":"Apply various color tints (sepia, red, green, blue, cyan, magenta, yellow, purple, orange, warm, cool, lime, navy, vintage, rose, teal, maroon, peach, lavender, olive) with adjustable strength.","status":"active","release_date":"2025-07-01","model_type":"image","page_url":"https://fal.run/fal-ai/post-processing/color-tint","tagline":"Apply various color tints (sepia, red, green, blue, cyan, magenta, yellow, purple, orange, warm, cool, lime, navy, vintage, rose, teal, maroon, peach, lavender, olive) with adjustable 
strength.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/post-processing/desaturate","name":"Post Processing Desaturate","created_by":"fal","source":"official","description":"Reduce color saturation using different methods (luminance Rec.709, luminance Rec.601, average, lightness) with adjustable factor.","status":"active","release_date":"2025-07-01","model_type":"image","page_url":"https://fal.run/fal-ai/post-processing/desaturate","tagline":"Reduce color saturation using different methods (luminance Rec.709, luminance Rec.601, average, lightness) with adjustable factor.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/post-processing/dissolve","name":"Post Processing Dissolve","created_by":"fal","source":"official","description":"Blend two images together using smooth linear interpolation with a configurable blend factor.","status":"active","release_date":"2025-07-01","model_type":"image","page_url":"https://fal.run/fal-ai/post-processing/dissolve","tagline":"Blend two images together using smooth linear interpolation with a configurable blend factor.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/post-processing/dodge-burn","name":"Post Processing Dodge Burn","created_by":"fal","source":"official","description":"Apply dodge and burn effects with multiple modes and adjustable intensity.","status":"active","release_date":"2025-07-01","model_type":"image","page_url":"https://fal.run/fal-ai/post-processing/dodge-burn","tagline":"Apply dodge and burn effects with multiple modes and adjustable 
intensity.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/post-processing/grain","name":"Post Processing Grain","created_by":"fal","source":"official","description":"Apply film grain effect with different styles (modern, analog, kodak, fuji, cinematic, newspaper) and customizable intensity and scale","status":"active","release_date":"2025-07-01","model_type":"image","page_url":"https://fal.run/fal-ai/post-processing/grain","tagline":"Apply film grain effect with different styles (modern, analog, kodak, fuji, cinematic, newspaper) and customizable intensity and scale","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/post-processing/parabolize","name":"Post Processing Parabolize","created_by":"fal","source":"official","description":"Apply a parabolic distortion effect with configurable coefficient and vertex position.","status":"active","release_date":"2025-07-01","model_type":"image","page_url":"https://fal.run/fal-ai/post-processing/parabolize","tagline":"Apply a parabolic distortion effect with configurable coefficient and vertex position.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/post-processing/sharpen","name":"Post Processing Sharpen","created_by":"fal","source":"official","description":"Apply sharpening effects with three modes: basic unsharp mask, smart sharpening with edge preservation, and Contrast Adaptive Sharpening (CAS).","status":"active","release_date":"2025-07-01","model_type":"image","page_url":"https://fal.run/fal-ai/post-processing/sharpen","tagline":"Apply sharpening effects with three modes: basic unsharp mask, smart sharpening with edge 
preservation, and Contrast Adaptive Sharpening (CAS).","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/post-processing/solarize","name":"Post Processing Solarize","created_by":"fal","source":"official","description":"Apply solarization effect by inverting pixel values above a threshold","status":"active","release_date":"2025-07-01","model_type":"image","page_url":"https://fal.run/fal-ai/post-processing/solarize","tagline":"Apply solarization effect by inverting pixel values above a threshold","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/post-processing/vignette","name":"Post Processing Vignette","created_by":"fal","source":"official","description":"Add a darkening vignette effect around the edges of the image with adjustable strength","status":"active","release_date":"2025-07-01","model_type":"image","page_url":"https://fal.run/fal-ai/post-processing/vignette","tagline":"Add a darkening vignette effect around the edges of the image with adjustable strength","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/post-processing","name":"Post Processing","created_by":"fal","source":"official","description":"Post Processing is an endpoint that can enhance images using a variety of techniques including grain, blur, sharpen, and more.","status":"active","release_date":"2025-02-18","model_type":"image","page_url":"https://fal.run/fal-ai/post-processing","tagline":"Post Processing is an endpoint that can enhance images using a variety of techniques including grain, blur, sharpen, and 
more.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/pshuman","name":"Pshuman","created_by":"fal","source":"official","description":"Use the 6D pose estimation capabilities of PSHuman to generate 3D files from single image.","status":"active","release_date":"2025-09-13","model_type":"other","page_url":"https://fal.run/fal-ai/pshuman","tagline":"Use the 6D pose estimation capabilities of PSHuman to generate 3D files from single image.","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/pulid","name":"PuLID","created_by":"fal","source":"official","description":"Tuning-free ID customization.","status":"active","release_date":"2023-12-14","model_type":"image","page_url":"https://fal.run/fal-ai/pulid","tagline":"Tuning-free ID customization.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/qwen-3-guard","name":"Qwen 3 Guard [8B]","created_by":"fal","source":"official","family":"qwen","description":"Use Qwen 3 Guard [8B] to detect and classify text as safe or harmful, delivering precise and reliable safety categorization.","status":"active","release_date":"2025-10-20","model_type":"other","page_url":"https://fal.run/fal-ai/qwen-3-guard","tagline":"Use Qwen 3 Guard [8B] to detect and classify text as safe or harmful, delivering precise and reliable safety categorization.","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/qwen-3-tts/clone-voice/0.6b","name":"Qwen 3 TTS - Clone Voice [0.6B]","created_by":"fal","source":"official","family":"qwen","description":"Clone your voices using Qwen3-TTS Clone-Voice model with zero shot cloning capabilities and use it on text-to-speech models to create speeches of 
yours!","status":"active","release_date":"2026-01-26","model_type":"other","page_url":"https://fal.run/fal-ai/qwen-3-tts/clone-voice/0.6b","tagline":"Clone your voices using Qwen3-TTS Clone-Voice model with zero shot cloning capabilities and use it on text-to-speech models to create speeches of yours!","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/qwen-3-tts/clone-voice/1.7b","name":"Qwen 3 TTS - Clone Voice [1.7B]","created_by":"fal","source":"official","family":"qwen","description":"Clone your voices using Qwen3-TTS Clone-Voice model with zero shot cloning capabilities and use it on text-to-speech models to create speeches of yours!","status":"active","release_date":"2026-01-26","model_type":"other","page_url":"https://fal.run/fal-ai/qwen-3-tts/clone-voice/1.7b","tagline":"Clone your voices using Qwen3-TTS Clone-Voice model with zero shot cloning capabilities and use it on text-to-speech models to create speeches of yours!","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/qwen-3-tts/text-to-speech/0.6b","name":"Qwen 3 TTS - Text to Speech [0.6B]","created_by":"fal","source":"official","family":"qwen","description":"Bring speech to your texts using Qwen3-TTS Custom-Voice model with pre-trained voices or use your custom voice with Qwen3-TTS Clone Voice model","status":"active","release_date":"2026-01-26","model_type":"tts","page_url":"https://fal.run/fal-ai/qwen-3-tts/text-to-speech/0.6b","tagline":"Bring speech to your texts using Qwen3-TTS Custom-Voice model with pre-trained voices or use your custom voice with Qwen3-TTS Clone Voice model","modalities":{"input":["text"],"output":["audio"]},"endpoints":["audio_speech"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/qwen-3-tts/text-to-speech/1.7b","name":"Qwen 3 TTS - Text to Speech [1.7B]","created_by":"fal","source":"official","family":"qwen","description":"Bring speech to your texts using Qwen3-TTS Custom-Voice model with pre-trained voices 
or use your custom voice with Qwen3-TTS Clone Voice model","status":"active","release_date":"2026-01-26","model_type":"tts","page_url":"https://fal.run/fal-ai/qwen-3-tts/text-to-speech/1.7b","tagline":"Bring speech to your texts using Qwen3-TTS Custom-Voice model with pre-trained voices or use your custom voice with Qwen3-TTS Clone Voice model","modalities":{"input":["text"],"output":["audio"]},"endpoints":["audio_speech"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/qwen-3-tts/voice-design/1.7b","name":"Qwen 3 TTS - Voice Design [1.7B]","created_by":"fal","source":"official","family":"qwen","description":"Create custom voices using Qwen3-TTS Voice Design model and later use Clone Voice model to create your own voices!","status":"active","release_date":"2026-01-26","model_type":"tts","page_url":"https://fal.run/fal-ai/qwen-3-tts/voice-design/1.7b","tagline":"Create custom voices using Qwen3-TTS Voice Design model and later use Clone Voice model to create your own voices!","modalities":{"input":["text"],"output":["audio"]},"endpoints":["audio_speech"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/qwen-image-2/edit","name":"Qwen Image 2","created_by":"fal","source":"official","family":"qwen","description":"Qwen-Image-2.0 is a next-generation foundational unified generation-and-editing model","status":"active","release_date":"2026-03-03","model_type":"image","page_url":"https://fal.run/fal-ai/qwen-image-2/edit","tagline":"Qwen-Image-2.0 is a next-generation foundational unified generation-and-editing model","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-05-07","last_updated":"2026-05-11"},{"id":"fal-ai/qwen-image-2/pro/edit","name":"Qwen Image 2","created_by":"fal","source":"official","family":"qwen","description":"Qwen-Image-2.0 is a next-generation foundational unified generation-and-editing 
model","status":"active","release_date":"2026-03-03","model_type":"image","page_url":"https://fal.run/fal-ai/qwen-image-2/pro/edit","tagline":"Qwen-Image-2.0 is a next-generation foundational unified generation-and-editing model","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-05-07","last_updated":"2026-05-11"},{"id":"fal-ai/qwen-image-2/pro/text-to-image","name":"Qwen Image 2","created_by":"fal","source":"official","family":"qwen","description":"Qwen-Image-2.0 is a next-generation foundational unified generation-and-editing model","status":"active","release_date":"2026-03-03","model_type":"image","page_url":"https://fal.run/fal-ai/qwen-image-2/pro/text-to-image","tagline":"Qwen-Image-2.0 is a next-generation foundational unified generation-and-editing model","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-05-07","last_updated":"2026-05-11"},{"id":"fal-ai/qwen-image-2/text-to-image","name":"Qwen Image 2","created_by":"fal","source":"official","family":"qwen","description":"Qwen-Image-2.0 is a next-generation foundational unified generation-and-editing model","status":"active","release_date":"2026-03-03","model_type":"image","page_url":"https://fal.run/fal-ai/qwen-image-2/text-to-image","tagline":"Qwen-Image-2.0 is a next-generation foundational unified generation-and-editing model","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-05-07","last_updated":"2026-05-11"},{"id":"fal-ai/qwen-image-2512/lora","name":"Qwen Image 2512","created_by":"fal","source":"official","family":"qwen","description":"LoRA inference endpoint for Qwen Image 2512, an improved version of Qwen Image with better text rendering, finer natural textures, and more realistic human 
generation.","status":"active","release_date":"2026-01-02","model_type":"image","page_url":"https://fal.run/fal-ai/qwen-image-2512/lora","tagline":"LoRA inference endpoint for Qwen Image 2512, an improved version of Qwen Image with better text rendering, finer natural textures, and more realistic human generation.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/qwen-image-2512-trainer-v2","name":"Qwen Image 2512 Trainer V2","created_by":"fal","source":"official","family":"qwen","description":"Fast LoRA trainer for Qwen-Image-2512","status":"active","release_date":"2026-01-15","model_type":"other","page_url":"https://fal.run/fal-ai/qwen-image-2512-trainer-v2","tagline":"Fast LoRA trainer for Qwen-Image-2512","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/qwen-image-2512-trainer","name":"Qwen Image 2512 Trainer","created_by":"fal","source":"official","family":"qwen","description":"Qwen Image 2512 LoRA training","status":"active","release_date":"2026-01-01","model_type":"other","page_url":"https://fal.run/fal-ai/qwen-image-2512-trainer","tagline":"Qwen Image 2512 LoRA training","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/qwen-image-2512","name":"Qwen Image 2512","created_by":"fal","source":"official","family":"qwen","description":"Qwen Image 2512 is an improved version of Qwen Image with better text rendering, finer natural textures, and more realistic human generation.","status":"active","release_date":"2025-12-30","model_type":"image","page_url":"https://fal.run/fal-ai/qwen-image-2512","tagline":"Qwen Image 2512 is an improved version of Qwen Image with better text rendering, finer natural textures, and more realistic human 
generation.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/qwen-image-edit-2509-lora-gallery/add-background","name":"Qwen Image Edit 2509 Lora Gallery","created_by":"fal","source":"official","family":"qwen","description":"Add a realistic scene behind the object with white background","status":"active","release_date":"2025-12-15","model_type":"image","page_url":"https://fal.run/fal-ai/qwen-image-edit-2509-lora-gallery/add-background","tagline":"Add a realistic scene behind the object with white background","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/qwen-image-edit-2509-lora-gallery/face-to-full-portrait","name":"Qwen Image Edit 2509 Lora Gallery","created_by":"fal","source":"official","family":"qwen","description":"Generate full portrait from a cropped face photo","status":"active","release_date":"2025-12-15","model_type":"image","page_url":"https://fal.run/fal-ai/qwen-image-edit-2509-lora-gallery/face-to-full-portrait","tagline":"Generate full portrait from a cropped face photo","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/qwen-image-edit-2509-lora-gallery/group-photo","name":"Qwen Image Edit 2509 Lora Gallery","created_by":"fal","source":"official","family":"qwen","description":"Create group photos ","status":"active","release_date":"2025-12-15","model_type":"image","page_url":"https://fal.run/fal-ai/qwen-image-edit-2509-lora-gallery/group-photo","tagline":"Create group photos 
","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/qwen-image-edit-2509-lora-gallery/integrate-product","name":"Qwen Image Edit 2509 Lora Gallery","created_by":"fal","source":"official","family":"qwen","description":"Blend products into backgrounds with automatic perspective and lighting correction","status":"active","release_date":"2025-12-15","model_type":"image","page_url":"https://fal.run/fal-ai/qwen-image-edit-2509-lora-gallery/integrate-product","tagline":"Blend products into backgrounds with automatic perspective and lighting correction","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/qwen-image-edit-2509-lora-gallery/lighting-restoration","name":"Qwen Image Edit 2509 Lora Gallery","created_by":"fal","source":"official","family":"qwen","description":"Removes harsh shadows and light spots from images, replacing them with soft, even, natural-looking illumination.","status":"active","release_date":"2025-12-15","model_type":"image","page_url":"https://fal.run/fal-ai/qwen-image-edit-2509-lora-gallery/lighting-restoration","tagline":"Removes harsh shadows and light spots from images, replacing them with soft, even, natural-looking illumination.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/qwen-image-edit-2509-lora-gallery/multiple-angles","name":"Qwen Image Edit 2509 Lora Gallery","created_by":"fal","source":"official","family":"qwen","description":"Precise camera position and angle control (rotation, zoom, vertical 
movement)","status":"active","release_date":"2025-12-15","model_type":"image","page_url":"https://fal.run/fal-ai/qwen-image-edit-2509-lora-gallery/multiple-angles","tagline":"Precise camera position and angle control (rotation, zoom, vertical movement)","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/qwen-image-edit-2509-lora-gallery/next-scene","name":"Qwen Image Edit 2509 Lora Gallery","created_by":"fal","source":"official","family":"qwen","description":"Create cinematic transitions and scene progressions (camera movements, framing changes)","status":"active","release_date":"2025-12-15","model_type":"image","page_url":"https://fal.run/fal-ai/qwen-image-edit-2509-lora-gallery/next-scene","tagline":"Create cinematic transitions and scene progressions (camera movements, framing changes)","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/qwen-image-edit-2509-lora-gallery/remove-element","name":"Qwen Image Edit 2509 Lora Gallery","created_by":"fal","source":"official","family":"qwen","description":"Remove unwanted elements (objects, people, text) while maintaining image consistency","status":"active","release_date":"2025-12-15","model_type":"image","page_url":"https://fal.run/fal-ai/qwen-image-edit-2509-lora-gallery/remove-element","tagline":"Remove unwanted elements (objects, people, text) while maintaining image consistency","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/qwen-image-edit-2509-lora-gallery/remove-lighting","name":"Qwen Image Edit 2509 Lora Gallery","created_by":"fal","source":"official","family":"qwen","description":"Remove existing lighting and apply 
soft, even illumination","status":"active","release_date":"2025-12-15","model_type":"image","page_url":"https://fal.run/fal-ai/qwen-image-edit-2509-lora-gallery/remove-lighting","tagline":"Remove existing lighting and apply soft, even illumination","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/qwen-image-edit-2509-lora-gallery/shirt-design","name":"Qwen Image Edit 2509 Lora Gallery","created_by":"fal","source":"official","family":"qwen","description":"Apply designs/graphics onto people's shirts","status":"active","release_date":"2025-12-15","model_type":"image","page_url":"https://fal.run/fal-ai/qwen-image-edit-2509-lora-gallery/shirt-design","tagline":"Apply designs/graphics onto people's shirts","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/qwen-image-edit-2509-lora","name":"Qwen Image Edit 2509 Lora","created_by":"fal","source":"official","family":"qwen","description":"LoRA endpoint for the Qwen Image Edit 2509 model.","status":"active","release_date":"2025-12-15","model_type":"image","page_url":"https://fal.run/fal-ai/qwen-image-edit-2509-lora","tagline":"LoRA endpoint for the Qwen Image Edit 2509 model.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/qwen-image-edit-2509-trainer","name":"Qwen Image Edit 2509 Trainer","created_by":"fal","source":"official","family":"qwen","description":"LoRA trainer for Qwen Image Edit 2509","status":"active","release_date":"2025-12-15","model_type":"other","page_url":"https://fal.run/fal-ai/qwen-image-edit-2509-trainer","tagline":"LoRA trainer for Qwen Image Edit 
2509","capabilities":{"vision":true},"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/qwen-image-edit-2509","name":"Qwen Image Edit 2509","created_by":"fal","source":"official","family":"qwen","description":"Endpoint for Qwen's Image Editing Plus model also known as Qwen-Image-Edit-2509.","status":"active","release_date":"2025-12-15","model_type":"image","page_url":"https://fal.run/fal-ai/qwen-image-edit-2509","tagline":"Endpoint for Qwen's Image Editing Plus model also known as Qwen-Image-Edit-2509.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/qwen-image-edit-2511/lora","name":"Qwen Image Edit 2511","created_by":"fal","source":"official","family":"qwen","description":"Endpoint for Qwen's Image Editing 2511 model with LoRa support.","status":"active","release_date":"2025-12-30","model_type":"image","page_url":"https://fal.run/fal-ai/qwen-image-edit-2511/lora","tagline":"Endpoint for Qwen's Image Editing 2511 model with LoRa support.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/qwen-image-edit-2511-multiple-angles","name":"Qwen Image Edit 2511 Multiple Angles","created_by":"fal","source":"official","family":"qwen","description":"Generates same scene from different angles (azimuth/elevation) with Qwen image Edit 2511 and the Lora Multiple Angles","status":"active","release_date":"2026-01-07","model_type":"image","page_url":"https://fal.run/fal-ai/qwen-image-edit-2511-multiple-angles","tagline":"Generates same scene from different angles (azimuth/elevation) with Qwen image Edit 2511 and the Lora Multiple 
Angles","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/qwen-image-edit-2511-trainer","name":"Qwen Image Edit 2511 Trainer","created_by":"fal","source":"official","family":"qwen","description":"LoRA trainer for Qwen Image Edit 2511","status":"active","release_date":"2025-12-23","model_type":"other","page_url":"https://fal.run/fal-ai/qwen-image-edit-2511-trainer","tagline":"LoRA trainer for Qwen Image Edit 2511","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/qwen-image-edit-2511","name":"Qwen Image Edit 2511","created_by":"fal","source":"official","family":"qwen","description":"Endpoint for Qwen's Image Editing 2511 model.","status":"active","release_date":"2025-12-19","model_type":"image","page_url":"https://fal.run/fal-ai/qwen-image-edit-2511","tagline":"Endpoint for Qwen's Image Editing 2511 model.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/qwen-image-edit/image-to-image","name":"Qwen Image Edit","created_by":"fal","source":"official","family":"qwen","description":"Image to Image Endpoint for Qwen's Image Editing model.","status":"active","release_date":"2025-09-30","model_type":"image","page_url":"https://fal.run/fal-ai/qwen-image-edit/image-to-image","tagline":"Image to Image Endpoint for Qwen's Image Editing model.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/qwen-image-edit/inpaint","name":"Qwen Image Edit","created_by":"fal","source":"official","family":"qwen","description":"Inpainting Endpoint for the Qwen Edit Image editing 
model.","status":"active","release_date":"2025-09-17","model_type":"image","page_url":"https://fal.run/fal-ai/qwen-image-edit/inpaint","tagline":"Inpainting Endpoint for the Qwen Edit Image editing model.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/qwen-image-edit-lora","name":"Qwen Image Edit Lora","created_by":"fal","source":"official","family":"qwen","description":"LoRA inference endpoint for the Qwen Image Editing model.","status":"active","release_date":"2025-09-10","model_type":"image","page_url":"https://fal.run/fal-ai/qwen-image-edit-lora","tagline":"LoRA inference endpoint for the Qwen Image Editing model.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/qwen-image-edit-plus-lora-gallery/add-background","name":"Qwen Image Edit Plus Lora Gallery","created_by":"fal","source":"official","family":"qwen","description":"Add a realistic scene behind the object with white background","status":"active","release_date":"2025-11-11","model_type":"image","page_url":"https://fal.run/fal-ai/qwen-image-edit-plus-lora-gallery/add-background","tagline":"Add a realistic scene behind the object with white background","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/qwen-image-edit-plus-lora-gallery/face-to-full-portrait","name":"Qwen Image Edit Plus Lora Gallery","created_by":"fal","source":"official","family":"qwen","description":"Generate full portrait from a cropped face photo","status":"active","release_date":"2025-11-11","model_type":"image","page_url":"https://fal.run/fal-ai/qwen-image-edit-plus-lora-gallery/face-to-full-portrait","tagline":"Generate full portrait 
from a cropped face photo","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/qwen-image-edit-plus-lora-gallery/group-photo","name":"Qwen Image Edit Plus Lora Gallery","created_by":"fal","source":"official","family":"qwen","description":"Create group photos ","status":"active","release_date":"2025-11-11","model_type":"image","page_url":"https://fal.run/fal-ai/qwen-image-edit-plus-lora-gallery/group-photo","tagline":"Create group photos ","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/qwen-image-edit-plus-lora-gallery/integrate-product","name":"Qwen Image Edit Plus Lora Gallery","created_by":"fal","source":"official","family":"qwen","description":"Blend products into backgrounds with automatic perspective and lighting correction","status":"active","release_date":"2025-11-11","model_type":"image","page_url":"https://fal.run/fal-ai/qwen-image-edit-plus-lora-gallery/integrate-product","tagline":"Blend products into backgrounds with automatic perspective and lighting correction","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/qwen-image-edit-plus-lora-gallery/lighting-restoration","name":"Qwen Image Edit Plus Lora Gallery","created_by":"fal","source":"official","family":"qwen","description":"Removes harsh shadows and light spots from images, replacing them with soft, even, natural-looking illumination.","status":"active","release_date":"2025-12-12","model_type":"image","page_url":"https://fal.run/fal-ai/qwen-image-edit-plus-lora-gallery/lighting-restoration","tagline":"Removes harsh shadows and light spots from images, replacing them with soft, even, natural-looking 
illumination.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/qwen-image-edit-plus-lora-gallery/multiple-angles","name":"Qwen Image Edit Plus Lora Gallery","created_by":"fal","source":"official","family":"qwen","description":"Precise camera position and angle control (rotation, zoom, vertical movement)","status":"active","release_date":"2025-11-11","model_type":"image","page_url":"https://fal.run/fal-ai/qwen-image-edit-plus-lora-gallery/multiple-angles","tagline":"Precise camera position and angle control (rotation, zoom, vertical movement)","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/qwen-image-edit-plus-lora-gallery/next-scene","name":"Qwen Image Edit Plus Lora Gallery","created_by":"fal","source":"official","family":"qwen","description":"Create cinematic transitions and scene progressions (camera movements, framing changes)","status":"active","release_date":"2025-11-11","model_type":"image","page_url":"https://fal.run/fal-ai/qwen-image-edit-plus-lora-gallery/next-scene","tagline":"Create cinematic transitions and scene progressions (camera movements, framing changes)","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/qwen-image-edit-plus-lora-gallery/remove-element","name":"Qwen Image Edit Plus Lora Gallery","created_by":"fal","source":"official","family":"qwen","description":"Remove unwanted elements (objects, people, text) while maintaining image consistency","status":"active","release_date":"2025-11-11","model_type":"image","page_url":"https://fal.run/fal-ai/qwen-image-edit-plus-lora-gallery/remove-element","tagline":"Remove unwanted elements (objects, 
people, text) while maintaining image consistency","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/qwen-image-edit-plus-lora-gallery/remove-lighting","name":"Qwen Image Edit Plus Lora Gallery","created_by":"fal","source":"official","family":"qwen","description":"Remove existing lighting and apply soft, even illumination","status":"active","release_date":"2025-11-11","model_type":"image","page_url":"https://fal.run/fal-ai/qwen-image-edit-plus-lora-gallery/remove-lighting","tagline":"Remove existing lighting and apply soft, even illumination","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/qwen-image-edit-plus-lora-gallery/shirt-design","name":"Qwen Image Edit Plus Lora Gallery","created_by":"fal","source":"official","family":"qwen","description":"Apply designs/graphics onto people's shirts","status":"active","release_date":"2025-11-11","model_type":"image","page_url":"https://fal.run/fal-ai/qwen-image-edit-plus-lora-gallery/shirt-design","tagline":"Apply designs/graphics onto people's shirts","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/qwen-image-edit-plus-lora","name":"Qwen Image Edit Plus Lora","created_by":"fal","source":"official","family":"qwen","description":"LoRA endpoint for the Qwen Image Edit Plus model.","status":"active","release_date":"2025-10-03","model_type":"image","page_url":"https://fal.run/fal-ai/qwen-image-edit-plus-lora","tagline":"LoRA endpoint for the Qwen Image Edit Plus 
model.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/qwen-image-edit-plus-trainer","name":"Qwen Image Edit Plus Trainer","created_by":"fal","source":"official","family":"qwen","description":"LoRA trainer for Qwen Image Edit Plus","status":"active","release_date":"2025-10-30","model_type":"other","page_url":"https://fal.run/fal-ai/qwen-image-edit-plus-trainer","tagline":"LoRA trainer for Qwen Image Edit Plus","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/qwen-image-edit-plus","name":"Qwen Image Edit Plus","created_by":"fal","source":"official","family":"qwen","description":"Endpoint for Qwen's Image Editing Plus model also known as Qwen-Image-Edit-2509.","status":"active","release_date":"2025-09-22","model_type":"image","page_url":"https://fal.run/fal-ai/qwen-image-edit-plus","tagline":"Endpoint for Qwen's Image Editing Plus model also known as Qwen-Image-Edit-2509.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/qwen-image-edit-trainer","name":"Qwen Image Edit Trainer","created_by":"fal","source":"official","family":"qwen","description":"LoRA trainer for Qwen Image Edit","status":"active","release_date":"2025-10-30","model_type":"other","page_url":"https://fal.run/fal-ai/qwen-image-edit-trainer","tagline":"LoRA trainer for Qwen Image Edit","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/qwen-image-edit","name":"Qwen Image Edit","created_by":"fal","source":"official","family":"qwen","description":"Endpoint for Qwen's Image Editing model.","status":"active","release_date":"2025-08-18","model_type":"image","page_url":"https://fal.run/fal-ai/qwen-image-edit","tagline":"Endpoint for Qwen's 
Image Editing model.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/qwen-image/image-to-image","name":"Qwen Image","created_by":"fal","source":"official","family":"qwen","description":"Qwen-Image (Image-to-Image) transforms and edits input images with high fidelity, enabling precise style transfer, enhancement, and creative modification.","status":"active","release_date":"2025-08-25","model_type":"image","page_url":"https://fal.run/fal-ai/qwen-image/image-to-image","tagline":"Qwen-Image (Image-to-Image) transforms and edits input images with high fidelity, enabling precise style transfer, enhancement, and creative modification.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/qwen-image-layered/lora","name":"Qwen Image Layered","created_by":"fal","source":"official","family":"qwen","description":"Qwen-Image-Layered is a model capable of decomposing an image into multiple RGBA layers.","status":"active","release_date":"2025-12-24","model_type":"image","page_url":"https://fal.run/fal-ai/qwen-image-layered/lora","tagline":"Qwen-Image-Layered is a model capable of decomposing an image into multiple RGBA layers.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/qwen-image-layered-trainer","name":"Qwen Image Layered Trainer","created_by":"fal","source":"official","family":"qwen","description":"Train LoRAs for the Qwen-Image-Layered model, customize how images are split into layers.","status":"active","release_date":"2025-12-23","model_type":"other","page_url":"https://fal.run/fal-ai/qwen-image-layered-trainer","tagline":"Train LoRAs for the Qwen-Image-Layered model, 
customize how images are split into layers.","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/qwen-image-layered","name":"Qwen Image Layered","created_by":"fal","source":"official","family":"qwen","description":"Qwen-Image-Layered is a model capable of decomposing an image into multiple RGBA layers.","status":"active","release_date":"2025-12-19","model_type":"image","page_url":"https://fal.run/fal-ai/qwen-image-layered","tagline":"Qwen-Image-Layered is a model capable of decomposing an image into multiple RGBA layers.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/qwen-image-max/edit","name":"Qwen Image Max","created_by":"fal","source":"official","family":"qwen","description":"Image editing endpoint for Qwen-Image-Max.","status":"active","release_date":"2026-01-27","model_type":"image","page_url":"https://fal.run/fal-ai/qwen-image-max/edit","tagline":"Image editing endpoint for Qwen-Image-Max.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-05-07","last_updated":"2026-05-11"},{"id":"fal-ai/qwen-image-max/text-to-image","name":"Qwen Image Max","created_by":"fal","source":"official","family":"qwen","description":"Text-to-Image endpoint for Qwen-Image-Max.","status":"active","release_date":"2026-01-27","model_type":"image","page_url":"https://fal.run/fal-ai/qwen-image-max/text-to-image","tagline":"Text-to-Image endpoint for Qwen-Image-Max.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-05-07","last_updated":"2026-05-11"},{"id":"fal-ai/qwen-image-trainer-v2","name":"Qwen Image Trainer V2","created_by":"fal","source":"official","family":"qwen","description":"Qwen Image LoRA 
training","status":"active","release_date":"2026-02-06","model_type":"other","page_url":"https://fal.run/fal-ai/qwen-image-trainer-v2","tagline":"Qwen Image LoRA training","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/qwen-image-trainer","name":"Qwen Image Trainer","created_by":"fal","source":"official","family":"qwen","description":"Qwen Image LoRA training","status":"active","release_date":"2025-08-14","model_type":"other","page_url":"https://fal.run/fal-ai/qwen-image-trainer","tagline":"Qwen Image LoRA training","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/qwen-image","name":"Qwen Image","created_by":"fal","source":"official","family":"qwen","description":"Qwen-Image is an image generation foundation model in the Qwen series that achieves significant advances in complex text rendering and precise image editing.","status":"active","release_date":"2025-08-04","model_type":"image","page_url":"https://fal.run/fal-ai/qwen-image","tagline":"Qwen-Image is an image generation foundation model in the Qwen series that achieves significant advances in complex text rendering and precise image editing.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/realistic-vision","name":"Realistic Vision","created_by":"fal","source":"official","description":"Generate realistic images.","status":"active","release_date":"2024-04-25","model_type":"image","page_url":"https://fal.run/fal-ai/realistic-vision","tagline":"Generate realistic images.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/reconviagen-0.5","name":"ReconViaGen 0.5","created_by":"fal","source":"official","description":"Generate 3D models from one or more images 
using ReconViaGen 0.5","status":"active","release_date":"2026-04-07","model_type":"other","page_url":"https://fal.run/fal-ai/reconviagen-0.5","tagline":"Generate 3D models from one or more images using ReconViaGen 0.5","capabilities":{"vision":true},"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/recraft-20b","name":"Recraft 20b","created_by":"fal","source":"official","description":"Recraft 20b is a new and affordable text-to-image model.","status":"active","release_date":"2024-12-16","model_type":"image","parameters":20,"page_url":"https://fal.run/fal-ai/recraft-20b","tagline":"Recraft 20b is a new and affordable text-to-image model.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/recraft/upscale/creative","name":"Recraft Creative Upscale","created_by":"fal","source":"official","description":"Enhances a given raster image using the 'creative upscale' tool, increasing image resolution, making the image sharper and cleaner.","status":"active","release_date":"2025-05-07","model_type":"image","page_url":"https://fal.run/fal-ai/recraft/upscale/creative","tagline":"Enhances a given raster image using the 'creative upscale' tool, increasing image resolution, making the image sharper and cleaner.","capabilities":{"vision":true,"tool_call":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"tools":["function_calling"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/recraft/upscale/crisp","name":"Recraft Crisp Upscale","created_by":"fal","source":"official","description":"Enhances a given raster image using 'crisp upscale' tool, boosting resolution with a focus on refining small details and faces.","status":"active","release_date":"2025-05-07","model_type":"image","page_url":"https://fal.run/fal-ai/recraft/upscale/crisp","tagline":"Enhances a given raster image 
using 'crisp upscale' tool, boosting resolution with a focus on refining small details and faces.","capabilities":{"vision":true,"tool_call":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"tools":["function_calling"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/recraft/v3/create-style","name":"Recraft V3 Create Style","created_by":"fal","source":"official","description":"Recraft V3 Create Style is capable of creating unique styles for Recraft V3 based on your images.","status":"active","release_date":"2025-05-07","model_type":"other","page_url":"https://fal.run/fal-ai/recraft/v3/create-style","tagline":"Recraft V3 Create Style is capable of creating unique styles for Recraft V3 based on your images.","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/recraft/v3/image-to-image","name":"Recraft V3","created_by":"fal","source":"official","description":"Recraft V3 is a text-to-image model with the ability to generate long texts, vector art, images in brand style, and much more.","status":"active","release_date":"2025-05-07","model_type":"image","page_url":"https://fal.run/fal-ai/recraft/v3/image-to-image","tagline":"Recraft V3 is a text-to-image model with the ability to generate long texts, vector art, images in brand style, and much more.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/recraft/v3/text-to-image","name":"Recraft V3","created_by":"fal","source":"official","description":"Recraft V3 is a text-to-image model with the ability to generate long texts, vector art, images in brand style, and much more.","status":"active","release_date":"2025-05-07","model_type":"image","page_url":"https://fal.run/fal-ai/recraft/v3/text-to-image","tagline":"Recraft V3 is a text-to-image model with the ability to generate long 
texts, vector art, images in brand style, and much more.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/recraft/v4/pro/text-to-image","name":"Recraft V4 Pro","created_by":"fal","source":"official","description":"Recraft V4 was developed with designers to bring true visual taste to AI image generation.","status":"active","release_date":"2026-02-12","model_type":"image","page_url":"https://fal.run/fal-ai/recraft/v4/pro/text-to-image","tagline":"Recraft V4 was developed with designers to bring true visual taste to AI image generation.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/recraft/v4/pro/text-to-vector","name":"Recraft V4 Pro (Vector)","created_by":"fal","source":"official","description":"Recraft V4 was developed with designers to bring true visual taste to AI image generation.","status":"active","release_date":"2026-02-16","model_type":"image","page_url":"https://fal.run/fal-ai/recraft/v4/pro/text-to-vector","tagline":"Recraft V4 was developed with designers to bring true visual taste to AI image generation.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-03-03","last_updated":"2026-05-11"},{"id":"fal-ai/recraft/v4/text-to-image","name":"Recraft V4","created_by":"fal","source":"official","description":"Recraft V4 was developed with designers to bring true visual taste to AI image generation.","status":"active","release_date":"2026-02-12","model_type":"image","page_url":"https://fal.run/fal-ai/recraft/v4/text-to-image","tagline":"Recraft V4 was developed with designers to bring true visual taste to AI image 
generation.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/recraft/v4/text-to-vector","name":"Recraft V4 (Vector)","created_by":"fal","source":"official","description":"Recraft V4 was developed with designers to bring true visual taste to AI image generation.","status":"active","release_date":"2026-02-16","model_type":"image","page_url":"https://fal.run/fal-ai/recraft/v4/text-to-vector","tagline":"Recraft V4 was developed with designers to bring true visual taste to AI image generation.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-03-03","last_updated":"2026-05-11"},{"id":"fal-ai/recraft/v4.1/pro/text-to-image","name":"Recraft V4.1 Text to Image Pro","created_by":"fal","source":"official","description":"Recraft V4.1 Pro pushes the V4.1 model into high-resolution territory — up to 2048×2048 and ultra-wide formats.","status":"active","release_date":"2026-05-14","model_type":"image","page_url":"https://fal.run/fal-ai/recraft/v4.1/pro/text-to-image","tagline":"Recraft V4.1 Pro pushes the V4.1 model into high-resolution territory — up to 2048×2048 and ultra-wide formats.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-05-14","last_updated":"2026-06-03"},{"id":"fal-ai/recraft/v4.1/pro/text-to-vector","name":"Recraft V4.1 Text to Vector Pro","created_by":"fal","source":"official","description":"Recraft V4.1 Pro Vector generates large-format, fully editable SVGs with the structural clarity professional illustrators expect.","status":"active","release_date":"2026-05-14","model_type":"image","page_url":"https://fal.run/fal-ai/recraft/v4.1/pro/text-to-vector","tagline":"Recraft V4.1 Pro Vector generates large-format, fully editable SVGs with the structural clarity professional illustrators 
expect.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-05-14","last_updated":"2026-06-03"},{"id":"fal-ai/recraft/v4.1/text-to-image","name":"Recraft V4.1 Text to Image","created_by":"fal","source":"official","description":" Recraft V4.1 builds on the design-first foundation of V4 with sharper prompt control and cleaner composition.","status":"active","release_date":"2026-05-14","model_type":"image","page_url":"https://fal.run/fal-ai/recraft/v4.1/text-to-image","tagline":" Recraft V4.1 builds on the design-first foundation of V4 with sharper prompt control and cleaner composition.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/recraft/v4.1/text-to-vector","name":"Recraft V4.1 Text to Vector","created_by":"fal","source":"official","description":"Recraft V4.1 Vector turns prompts into fully editable SVGs with structured layers and clean geometry.","status":"active","release_date":"2026-05-14","model_type":"image","page_url":"https://fal.run/fal-ai/recraft/v4.1/text-to-vector","tagline":"Recraft V4.1 Vector turns prompts into fully editable SVGs with structured layers and clean geometry.","capabilities":{"vision":true,"structured_output":true,"json_mode":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-05-14","last_updated":"2026-06-03"},{"id":"fal-ai/recraft/v4.1/utility/pro/text-to-image","name":"Recraft V4.1 Utility Text to Image","created_by":"fal","source":"official","description":"Recraft V4.1 Utility Pro pairs the high-resolution output of V4.1 Pro with a faster, cost-efficient runtime.","status":"active","release_date":"2026-05-14","model_type":"image","page_url":"https://fal.run/fal-ai/recraft/v4.1/utility/pro/text-to-image","tagline":"Recraft V4.1 Utility Pro pairs the high-resolution output of V4.1 
Pro with a faster, cost-efficient runtime.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-05-14","last_updated":"2026-06-03"},{"id":"fal-ai/recraft/v4.1/utility/text-to-image","name":"Recraft V4.1 Text to Image Utility","created_by":"fal","source":"official","description":"Recraft V4.1 Utility is a faster, lighter variant of V4.1 made for high-volume creative workflows.","status":"active","release_date":"2026-05-14","model_type":"image","page_url":"https://fal.run/fal-ai/recraft/v4.1/utility/text-to-image","tagline":"Recraft V4.1 Utility is a faster, lighter variant of V4.1 made for high-volume creative workflows.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-05-14","last_updated":"2026-06-03"},{"id":"fal-ai/recraft/vectorize","name":"Recraft","created_by":"fal","source":"official","description":"Converts a given raster image to SVG format using Recraft model.","status":"active","release_date":"2025-06-12","model_type":"image","page_url":"https://fal.run/fal-ai/recraft/vectorize","tagline":"Converts a given raster image to SVG format using Recraft model.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/retoucher","name":"Face Retoucher","created_by":"fal","source":"official","description":"Automatically retouches faces to smooth skin and remove blemishes.","status":"active","release_date":"2024-02-13","model_type":"image","page_url":"https://fal.run/fal-ai/retoucher","tagline":"Automatically retouches faces to smooth skin and remove 
blemishes.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/rife/video","name":"RIFE","created_by":"fal","source":"official","description":"Interpolate videos with RIFE - Real-Time Intermediate Flow Estimation","status":"active","release_date":"2025-07-22","model_type":"other","page_url":"https://fal.run/fal-ai/rife/video","tagline":"Interpolate videos with RIFE - Real-Time Intermediate Flow Estimation","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/rife","name":"RIFE","created_by":"fal","source":"official","description":"Interpolate images with RIFE - Real-Time Intermediate Flow Estimation","status":"active","release_date":"2025-07-22","model_type":"image","page_url":"https://fal.run/fal-ai/rife","tagline":"Interpolate images with RIFE - Real-Time Intermediate Flow Estimation","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/sa2va/4b/image","name":"Sa2VA 4B Image","created_by":"fal","source":"official","description":"Sa2VA is an MLLM capable of question answering, visual prompt understanding, and dense object segmentation at both image and video levels","status":"active","release_date":"2025-01-13","model_type":"other","page_url":"https://fal.run/fal-ai/sa2va/4b/image","tagline":"Sa2VA is an MLLM capable of question answering, visual prompt understanding, and dense object segmentation at both image and video levels","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/sa2va/4b/video","name":"Sa2VA 4B Video","created_by":"fal","source":"official","description":"Sa2VA is an MLLM capable of question answering, visual prompt understanding, and dense object segmentation at both image and video 
levels","status":"active","release_date":"2025-01-13","model_type":"other","page_url":"https://fal.run/fal-ai/sa2va/4b/video","tagline":"Sa2VA is an MLLM capable of question answering, visual prompt understanding, and dense object segmentation at both image and video levels","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/sa2va/8b/image","name":"Sa2VA 8B Image","created_by":"fal","source":"official","description":"Sa2VA is an MLLM capable of question answering, visual prompt understanding, and dense object segmentation at both image and video levels","status":"active","release_date":"2025-01-13","model_type":"other","page_url":"https://fal.run/fal-ai/sa2va/8b/image","tagline":"Sa2VA is an MLLM capable of question answering, visual prompt understanding, and dense object segmentation at both image and video levels","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/sa2va/8b/video","name":"Sa2VA 8B Video","created_by":"fal","source":"official","description":"Sa2VA is an MLLM capable of question answering, visual prompt understanding, and dense object segmentation at both image and video levels","status":"active","release_date":"2025-01-13","model_type":"other","page_url":"https://fal.run/fal-ai/sa2va/8b/video","tagline":"Sa2VA is an MLLM capable of question answering, visual prompt understanding, and dense object segmentation at both image and video levels","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/sadtalker/reference","name":"Sad Talker","created_by":"fal","source":"official","description":"Learning Realistic 3D Motion Coefficients for Stylized Audio-Driven Single Image Talking Face Animation","status":"active","release_date":"2024-12-20","model_type":"video","page_url":"https://fal.run/fal-ai/sadtalker/reference","tagline":"Learning Realistic 3D Motion Coefficients for Stylized Audio-Driven Single Image 
Talking Face Animation","capabilities":{"vision":true},"modalities":{"input":["text","image","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/sadtalker","name":"Sad Talker","created_by":"fal","source":"official","description":"Learning Realistic 3D Motion Coefficients for Stylized Audio-Driven Single Image Talking Face Animation","status":"active","release_date":"2024-04-11","model_type":"video","page_url":"https://fal.run/fal-ai/sadtalker","tagline":"Learning Realistic 3D Motion Coefficients for Stylized Audio-Driven Single Image Talking Face Animation","capabilities":{"vision":true},"modalities":{"input":["text","image","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/sam-3-1/image-rle","name":"Sam 3 1","created_by":"fal","source":"official","description":"SAM 3.1 builds comes with Object Multiplex, a shared-memory approach for joint multi-object tracking that delivers faster speeds with larger number of objects tracked.","status":"active","release_date":"2026-03-30","model_type":"image","page_url":"https://fal.run/fal-ai/sam-3-1/image-rle","tagline":"SAM 3.1 builds comes with Object Multiplex, a shared-memory approach for joint multi-object tracking that delivers faster speeds with larger number of objects tracked.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-05-07","last_updated":"2026-05-11"},{"id":"fal-ai/sam-3-1/image","name":"Sam 3 1","created_by":"fal","source":"official","description":"SAM 3.1 builds comes with Object Multiplex, a shared-memory approach for joint multi-object tracking that delivers faster speeds with larger number of objects tracked.","status":"active","release_date":"2026-03-30","model_type":"image","page_url":"https://fal.run/fal-ai/sam-3-1/image","tagline":"SAM 3.1 builds comes with Object Multiplex, a 
shared-memory approach for joint multi-object tracking that delivers faster speeds with larger number of objects tracked.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-05-07","last_updated":"2026-05-11"},{"id":"fal-ai/sam-3-1/video-rle","name":"Sam 3 1","created_by":"fal","source":"official","description":"SAM 3.1 builds comes with Object Multiplex, a shared-memory approach for joint multi-object tracking that delivers faster speeds with larger number of objects tracked.","status":"active","release_date":"2026-03-30","model_type":"other","page_url":"https://fal.run/fal-ai/sam-3-1/video-rle","tagline":"SAM 3.1 builds comes with Object Multiplex, a shared-memory approach for joint multi-object tracking that delivers faster speeds with larger number of objects tracked.","last_seen_at":"2026-05-07","last_updated":"2026-05-11"},{"id":"fal-ai/sam-3-1/video","name":"Sam 3 1","created_by":"fal","source":"official","description":"SAM 3.1 builds comes with Object Multiplex, a shared-memory approach for joint multi-object tracking that delivers faster speeds with larger number of objects tracked.","status":"active","release_date":"2026-03-30","model_type":"other","page_url":"https://fal.run/fal-ai/sam-3-1/video","tagline":"SAM 3.1 builds comes with Object Multiplex, a shared-memory approach for joint multi-object tracking that delivers faster speeds with larger number of objects tracked.","last_seen_at":"2026-05-07","last_updated":"2026-05-11"},{"id":"fal-ai/sam-3/3d-align","name":"Sam 3","created_by":"fal","source":"official","description":"SAM 3D enables full scene reconstructions, placing objects and humans in a shared context together.","status":"active","release_date":"2025-12-02","model_type":"other","page_url":"https://fal.run/fal-ai/sam-3/3d-align","tagline":"SAM 3D enables full scene reconstructions, placing objects and humans in a shared context 
together.","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/sam-3/3d-body","name":"Sam 3","created_by":"fal","source":"official","description":"SAM 3D allows for accurate 3D reconstruction of human body shape and position from a single image.","status":"active","release_date":"2025-12-02","model_type":"other","page_url":"https://fal.run/fal-ai/sam-3/3d-body","tagline":"SAM 3D allows for accurate 3D reconstruction of human body shape and position from a single image.","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/sam-3/3d-objects","name":"Sam 3","created_by":"fal","source":"official","description":"SAM 3D enables precise 3D reconstruction of objects from real images, while accurately reconstructing their geometry and texture.","status":"active","release_date":"2025-12-02","model_type":"other","page_url":"https://fal.run/fal-ai/sam-3/3d-objects","tagline":"SAM 3D enables precise 3D reconstruction of objects from real images, while accurately reconstructing their geometry and texture.","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/sam-3/image/embed","name":"Sam 3","created_by":"fal","source":"official","description":"SAM 3 is a unified foundation model for promptable segmentation in images and videos.","status":"active","release_date":"2025-11-20","model_type":"other","page_url":"https://fal.run/fal-ai/sam-3/image/embed","tagline":"SAM 3 is a unified foundation model for promptable segmentation in images and videos.","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/sam-3/image-rle","name":"Sam 3","created_by":"fal","source":"official","description":"SAM 3 is a unified foundation model for promptable segmentation in images and videos.","status":"active","release_date":"2025-11-20","model_type":"image","page_url":"https://fal.run/fal-ai/sam-3/image-rle","tagline":"SAM 3 is a unified 
foundation model for promptable segmentation in images and videos.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/sam-3/image","name":"Segment Anything Model 3","created_by":"fal","source":"official","description":"SAM 3 is a unified foundation model for promptable segmentation in images and videos.","status":"active","release_date":"2025-11-20","model_type":"image","page_url":"https://fal.run/fal-ai/sam-3/image","tagline":"SAM 3 is a unified foundation model for promptable segmentation in images and videos.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/sam-3/video-rle","name":"Sam 3","created_by":"fal","source":"official","description":"SAM 3 is a unified foundation model for promptable segmentation in images and videos.","status":"active","release_date":"2025-11-20","model_type":"other","page_url":"https://fal.run/fal-ai/sam-3/video-rle","tagline":"SAM 3 is a unified foundation model for promptable segmentation in images and videos.","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/sam-3/video","name":"Sam 3","created_by":"fal","source":"official","description":"SAM 3 is a unified foundation model for promptable segmentation in images and videos.","status":"active","release_date":"2025-11-20","model_type":"other","page_url":"https://fal.run/fal-ai/sam-3/video","tagline":"SAM 3 is a unified foundation model for promptable segmentation in images and videos.","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/sam-audio/separate","name":"Sam Audio","created_by":"fal","source":"official","description":"Audio separation with SAM 
Audio.","status":"active","release_date":"2025-12-30","model_type":"other","page_url":"https://fal.run/fal-ai/sam-audio/separate","tagline":"Audio separation with SAM Audio.","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/sam-audio/span-separate","name":"Sam Audio","created_by":"fal","source":"official","description":"Audio separation with SAM Audio.","status":"active","release_date":"2025-12-30","model_type":"other","page_url":"https://fal.run/fal-ai/sam-audio/span-separate","tagline":"Audio separation with SAM Audio.","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/sam-audio/visual-separate","name":"Sam Audio","created_by":"fal","source":"official","description":"Audio separation with SAM Audio.","status":"active","release_date":"2025-12-30","model_type":"other","page_url":"https://fal.run/fal-ai/sam-audio/visual-separate","tagline":"Audio separation with SAM Audio.","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/sam2/auto-segment","name":"Segment Anything Model 2","created_by":"fal","source":"official","description":"SAM 2 is a model for segmenting images automatically.","status":"active","release_date":"2025-02-25","model_type":"image","page_url":"https://fal.run/fal-ai/sam2/auto-segment","tagline":"SAM 2 is a model for segmenting images automatically.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/sam2/image","name":"Segment Anything Model 2","created_by":"fal","source":"official","description":"SAM 2 is a model for segmenting images and videos in real-time.","status":"active","release_date":"2024-08-15","model_type":"image","page_url":"https://fal.run/fal-ai/sam2/image","tagline":"SAM 2 is a model for segmenting images and videos in 
real-time.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/sam2/video","name":"Segment Anything Model 2","created_by":"fal","source":"official","description":"SAM 2 is a model for segmenting images and videos in real-time.","status":"active","release_date":"2024-08-15","model_type":"other","page_url":"https://fal.run/fal-ai/sam2/video","tagline":"SAM 2 is a model for segmenting images and videos in real-time.","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/sana/sprint","name":"Sana Sprint","created_by":"fal","source":"official","description":"Sana Sprint is a text-to-image model capable of generating 4K images with exceptional speed.","status":"active","release_date":"2025-03-31","model_type":"image","page_url":"https://fal.run/fal-ai/sana/sprint","tagline":"Sana Sprint is a text-to-image model capable of generating 4K images with exceptional speed.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/sana/v1.5/1.6b","name":"Sana v1.5 1.6B","created_by":"fal","source":"official","description":"Sana v1.5 1.6B is a lightweight text-to-image model that delivers 4K image generation with impressive efficiency.","status":"active","release_date":"2025-03-31","model_type":"image","page_url":"https://fal.run/fal-ai/sana/v1.5/1.6b","tagline":"Sana v1.5 1.6B is a lightweight text-to-image model that delivers 4K image generation with impressive efficiency.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/sana/v1.5/4.8b","name":"Sana v1.5 4.8B","created_by":"fal","source":"official","description":"Sana v1.5 4.8B is a powerful text-to-image 
model that generates ultra-high quality 4K images with remarkable detail.","status":"active","release_date":"2025-03-31","model_type":"image","page_url":"https://fal.run/fal-ai/sana/v1.5/4.8b","tagline":"Sana v1.5 4.8B is a powerful text-to-image model that generates ultra-high quality 4K images with remarkable detail.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/sana-video","name":"Sana Video","created_by":"fal","source":"official","description":"Leverage Sana's ultra-fast processing speed to generate high-quality assets that transform your text prompts into production-ready videos","status":"active","release_date":"2025-11-07","model_type":"video","page_url":"https://fal.run/fal-ai/sana-video","tagline":"Leverage Sana's ultra-fast processing speed to generate high-quality assets that transform your text prompts into production-ready videos","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/sana","name":"Sana","created_by":"fal","source":"official","description":"Sana can synthesize high-resolution, high-quality images with strong text-image alignment at a remarkably fast speed, with the ability to generate 4K images in less than a second.","status":"active","release_date":"2024-08-01","model_type":"image","page_url":"https://fal.run/fal-ai/sana","tagline":"Sana can synthesize high-resolution, high-quality images with strong text-image alignment at a remarkably fast speed, with the ability to generate 4K images in less than a second.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/scail-2","name":"Scail 2","created_by":"fal","source":"official","description":"SCAIL-2 is an end-to-end character animation model that 
drives a reference character from a source video without relying on intermediate pose representations like skeleton maps.","status":"active","release_date":"2026-06-18","model_type":"other","page_url":"https://fal.run/fal-ai/scail-2","tagline":"SCAIL-2 is an end-to-end character animation model that drives a reference character from a source video without relying on intermediate pose representations like skeleton maps.","last_seen_at":"2026-06-18","last_updated":"2026-06-20"},{"id":"fal-ai/scail","name":"Scail","created_by":"fal","source":"official","description":"SCAIL is a character animation model that uses 3D consistent pose representations to animate reference images with coherent motion, supporting complex movements.","status":"active","release_date":"2025-12-17","model_type":"other","page_url":"https://fal.run/fal-ai/scail","tagline":"SCAIL is a character animation model that uses 3D consistent pose representations to animate reference images with coherent motion, supporting complex movements.","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/scene-finder","name":"Scene Finder","created_by":"fal","source":"official","description":"Search any video with a text prompt - Scene Finder locates the matching moments and returns their time segments and extracted frames.","status":"active","release_date":"2026-06-03","model_type":"other","page_url":"https://fal.run/fal-ai/scene-finder","tagline":"Search any video with a text prompt - Scene Finder locates the matching moments and returns their time segments and extracted frames.","capabilities":{"vision":true},"last_seen_at":"2026-06-03","last_updated":"2026-06-10"},{"id":"fal-ai/sd15-depth-controlnet","name":"SD 1.5 Depth ControlNet","created_by":"fal","source":"official","description":"SD 1.5 ControlNet","status":"active","release_date":"2024-05-31","model_type":"image","page_url":"https://fal.run/fal-ai/sd15-depth-controlnet","tagline":"SD 1.5 
ControlNet","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/sdxl-controlnet-union/image-to-image","name":"SDXL ControlNet Union","created_by":"fal","source":"official","description":"An efficent SDXL multi-controlnet image-to-image model.","status":"active","release_date":"2024-07-31","model_type":"image","page_url":"https://fal.run/fal-ai/sdxl-controlnet-union/image-to-image","tagline":"An efficent SDXL multi-controlnet image-to-image model.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/sdxl-controlnet-union/inpainting","name":"SDXL ControlNet Union","created_by":"fal","source":"official","description":"An efficent SDXL multi-controlnet inpainting model.","status":"active","release_date":"2024-07-31","model_type":"image","page_url":"https://fal.run/fal-ai/sdxl-controlnet-union/inpainting","tagline":"An efficent SDXL multi-controlnet inpainting model.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/sdxl-controlnet-union","name":"SDXL ControlNet Union","created_by":"fal","source":"official","description":"An efficent SDXL multi-controlnet text-to-image model.","status":"active","release_date":"2024-07-31","model_type":"image","page_url":"https://fal.run/fal-ai/sdxl-controlnet-union","tagline":"An efficent SDXL multi-controlnet text-to-image model.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/seedvr/upscale/image/seamless","name":"SeedVR2","created_by":"fal","source":"official","description":"Use SeedVR2 to upscale images, retaining 
seamless tiling","status":"active","release_date":"2026-03-23","model_type":"image","page_url":"https://fal.run/fal-ai/seedvr/upscale/image/seamless","tagline":"Use SeedVR2 to upscale images, retaining seamless tiling","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-05-26","last_updated":"2026-06-03"},{"id":"fal-ai/seedvr/upscale/image","name":"SeedVR2","created_by":"fal","source":"official","description":"Use SeedVR2 to upscale your images","status":"active","release_date":"2025-09-22","model_type":"image","page_url":"https://fal.run/fal-ai/seedvr/upscale/image","tagline":"Use SeedVR2 to upscale your images","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-05-26","last_updated":"2026-06-03"},{"id":"fal-ai/seedvr/upscale/video","name":"SeedVR2","created_by":"fal","source":"official","description":"Upscale your videos using SeedVR2 with temporal consistency!","status":"active","release_date":"2025-09-22","model_type":"other","page_url":"https://fal.run/fal-ai/seedvr/upscale/video","tagline":"Upscale your videos using SeedVR2 with temporal consistency!","last_seen_at":"2026-05-26","last_updated":"2026-06-03"},{"id":"fal-ai/sensenova-u1-infographic","name":"Sensenova U1 Infographic","created_by":"fal","source":"official","description":"Generate Infographic Image with Sensenova U1","status":"active","release_date":"2026-06-17","model_type":"image","page_url":"https://fal.run/fal-ai/sensenova-u1-infographic","tagline":"Generate Infographic Image with Sensenova U1","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-17","last_updated":"2026-06-18"},{"id":"fal-ai/silero-vad","name":"Silero VAD","created_by":"fal","source":"official","description":"Detect speech presence and timestamps with accuracy and speed using the 
ultra-lightweight Silero VAD model","status":"active","release_date":"2026-01-08","model_type":"transcription","page_url":"https://fal.run/fal-ai/silero-vad","tagline":"Detect speech presence and timestamps with accuracy and speed using the ultra-lightweight Silero VAD model","modalities":{"input":["audio"],"output":["text"]},"endpoints":["audio_transcriptions"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/skyreels-i2v","name":"Skyreels V1 (Image-to-Video)","created_by":"fal","source":"official","description":"SkyReels V1 is the first and most advanced open-source human-centric video foundation model.","status":"active","release_date":"2025-02-18","model_type":"video","page_url":"https://fal.run/fal-ai/skyreels-i2v","tagline":"SkyReels V1 is the first and most advanced open-source human-centric video foundation model.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/smart-resize","name":"Smart Resize","created_by":"fal","source":"official","description":" Smart image resize to arbitrary dimensions, powered by Nano Banana Pro with vision-LLM-guided prompting for composition-aware recomposition.","status":"active","release_date":"2026-04-28","model_type":"image","page_url":"https://fal.run/fal-ai/smart-resize","tagline":" Smart image resize to arbitrary dimensions, powered by Nano Banana Pro with vision-LLM-guided prompting for composition-aware recomposition.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-05-07","last_updated":"2026-05-11"},{"id":"fal-ai/smart-turn","name":"Pipecat's Smart Turn model","created_by":"fal","source":"official","description":"An open source, community-driven and native audio turn detection model by Pipecat 
AI.","status":"active","release_date":"2025-04-21","model_type":"transcription","page_url":"https://fal.run/fal-ai/smart-turn","tagline":"An open source, community-driven and native audio turn detection model by Pipecat AI.","modalities":{"input":["audio"],"output":["text"]},"endpoints":["audio_transcriptions"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/sora-2/characters","name":"Sora 2","created_by":"fal","source":"official","family":"sora-2","description":"Generate character ids to use with Sora 2 generations","status":"active","release_date":"2026-03-12","model_type":"video","page_url":"https://fal.run/fal-ai/sora-2/characters","tagline":"Generate character ids to use with Sora 2 generations","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-03-13","last_updated":"2026-05-11"},{"id":"fal-ai/sora-2/image-to-video/pro","name":"Sora 2","created_by":"fal","source":"official","family":"sora-2","description":"Image-to-video endpoint for Sora 2 Pro, OpenAI's state-of-the-art video model capable of creating richly detailed, dynamic clips with audio from natural language or images.","status":"active","release_date":"2025-10-06","model_type":"video","page_url":"https://fal.run/fal-ai/sora-2/image-to-video/pro","tagline":"Image-to-video endpoint for Sora 2 Pro, OpenAI's state-of-the-art video model capable of creating richly detailed, dynamic clips with audio from natural language or images.","capabilities":{"vision":true},"modalities":{"input":["text","image","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/sora-2/image-to-video","name":"Sora 2","created_by":"fal","source":"official","family":"sora-2","description":"Image-to-video endpoint for Sora 2, OpenAI's state-of-the-art video model capable of creating richly detailed, dynamic clips with audio from natural language or 
images.","status":"active","release_date":"2025-10-06","model_type":"video","page_url":"https://fal.run/fal-ai/sora-2/image-to-video","tagline":"Image-to-video endpoint for Sora 2, OpenAI's state-of-the-art video model capable of creating richly detailed, dynamic clips with audio from natural language or images.","capabilities":{"vision":true},"modalities":{"input":["text","image","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/sora-2/text-to-video/pro","name":"Sora 2","created_by":"fal","source":"official","family":"sora-2","description":"Text-to-video endpoint for Sora 2 Pro, OpenAI's state-of-the-art video model capable of creating richly detailed, dynamic clips with audio from natural language or images.","status":"active","release_date":"2025-10-06","model_type":"video","page_url":"https://fal.run/fal-ai/sora-2/text-to-video/pro","tagline":"Text-to-video endpoint for Sora 2 Pro, OpenAI's state-of-the-art video model capable of creating richly detailed, dynamic clips with audio from natural language or images.","capabilities":{"vision":true},"modalities":{"input":["text","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/sora-2/text-to-video","name":"Sora 2","created_by":"fal","source":"official","family":"sora-2","description":"Text-to-video endpoint for Sora 2, OpenAI's state-of-the-art video model capable of creating richly detailed, dynamic clips with audio from natural language or images.","status":"active","release_date":"2025-10-06","model_type":"video","page_url":"https://fal.run/fal-ai/sora-2/text-to-video","tagline":"Text-to-video endpoint for Sora 2, OpenAI's state-of-the-art video model capable of creating richly detailed, dynamic clips with audio from natural language or 
images.","capabilities":{"vision":true},"modalities":{"input":["text","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/sora-2/video-to-video/remix","name":"Sora 2","created_by":"fal","source":"official","family":"sora-2","description":"Video-to-video remix endpoint for Sora 2, OpenAI’s advanced model that transforms existing videos based on new text or image prompts allowing rich edits, style changes, and creative reinterpretations ","status":"active","release_date":"2025-10-08","model_type":"other","page_url":"https://fal.run/fal-ai/sora-2/video-to-video/remix","tagline":"Video-to-video remix endpoint for Sora 2, OpenAI’s advanced model that transforms existing videos based on new text or image prompts allowing rich edits, style changes, and creative reinterpretations ","capabilities":{"vision":true},"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/speech-to-text/stream","name":"Speech-To-text","created_by":"fal","source":"official","description":"Leverage the rapid processing capabilities of AI models to enable accurate and efficient real-time speech-to-text transcription.","status":"active","release_date":"2025-04-04","model_type":"transcription","page_url":"https://fal.run/fal-ai/speech-to-text/stream","tagline":"Leverage the rapid processing capabilities of AI models to enable accurate and efficient real-time speech-to-text transcription.","modalities":{"input":["audio"],"output":["text"]},"endpoints":["audio_transcriptions"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/speech-to-text/turbo/stream","name":"Speech-to-Text","created_by":"fal","source":"official","description":"Leverage the rapid processing capabilities of AI models to enable accurate and efficient real-time speech-to-text 
transcription.","status":"active","release_date":"2025-04-04","model_type":"transcription","page_url":"https://fal.run/fal-ai/speech-to-text/turbo/stream","tagline":"Leverage the rapid processing capabilities of AI models to enable accurate and efficient real-time speech-to-text transcription.","modalities":{"input":["audio"],"output":["text"]},"endpoints":["audio_transcriptions"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/speech-to-text/turbo","name":"Speech-to-Text","created_by":"fal","source":"official","description":"Leverage the rapid processing capabilities of AI models to enable accurate and efficient real-time speech-to-text transcription.","status":"active","release_date":"2025-04-04","model_type":"transcription","page_url":"https://fal.run/fal-ai/speech-to-text/turbo","tagline":"Leverage the rapid processing capabilities of AI models to enable accurate and efficient real-time speech-to-text transcription.","modalities":{"input":["audio"],"output":["text"]},"endpoints":["audio_transcriptions"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/speech-to-text","name":"Speech-to-Text","created_by":"fal","source":"official","description":"Leverage the rapid processing capabilities of AI models to enable accurate and efficient real-time speech-to-text transcription.","status":"active","release_date":"2025-04-04","model_type":"transcription","page_url":"https://fal.run/fal-ai/speech-to-text","tagline":"Leverage the rapid processing capabilities of AI models to enable accurate and efficient real-time speech-to-text transcription.","capabilities":{"streaming":true},"modalities":{"input":["audio"],"output":["text"]},"endpoints":["audio_transcriptions"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/stable-audio-25/audio-to-audio","name":"Stable Audio 2.5","created_by":"fal","source":"official","description":"Generate high quality music and sound effects using Stable Audio 2.5 from 
StabilityAI","status":"active","release_date":"2025-09-10","model_type":"other","page_url":"https://fal.run/fal-ai/stable-audio-25/audio-to-audio","tagline":"Generate high quality music and sound effects using Stable Audio 2.5 from StabilityAI","last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/stable-audio-25/inpaint","name":"Stable Audio 25","created_by":"fal","source":"official","description":"Generate high quality music and sound effects using Stable Audio 2.5 from StabilityAI","status":"active","release_date":"2025-09-10","model_type":"other","page_url":"https://fal.run/fal-ai/stable-audio-25/inpaint","tagline":"Generate high quality music and sound effects using Stable Audio 2.5 from StabilityAI","last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/stable-audio-25/text-to-audio","name":"Stable Audio 2.5","created_by":"fal","source":"official","description":"Generate high quality music and sound effects using Stable Audio 2.5 from StabilityAI","status":"active","release_date":"2025-09-10","model_type":"other","page_url":"https://fal.run/fal-ai/stable-audio-25/text-to-audio","tagline":"Generate high quality music and sound effects using Stable Audio 2.5 from StabilityAI","last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/stable-audio-3/medium/audio-inpainting","name":"Stable Audio 3 Medium Audio Inpainting","created_by":"fal","source":"official","description":"Stable Audio 3 Medium audio inpainting is a 1.4 billion parameter latent diffusion model that fills in or reworks selected segments of a stereo track guided by text prompts, supporting single- and mul","status":"active","release_date":"2026-05-22","model_type":"other","page_url":"https://fal.run/fal-ai/stable-audio-3/medium/audio-inpainting","tagline":"Stable Audio 3 Medium audio inpainting is a 1.4 billion parameter latent diffusion model that fills in or reworks selected segments of a stereo track guided by text prompts, supporting single- and 
mul","last_seen_at":"2026-06-03","last_updated":"2026-06-10"},{"id":"fal-ai/stable-audio-3/medium/audio-outpainting","name":"Stable Audio 3 Medium Audio Outpainting","created_by":"fal","source":"official","description":"Stable Audio 3 Medium audio outpainting is a 1.4 billion parameter latent diffusion model that extends existing stereo audio beyond its original endpoint via causal continuation guided by text prompts","status":"active","release_date":"2026-05-22","model_type":"other","page_url":"https://fal.run/fal-ai/stable-audio-3/medium/audio-outpainting","tagline":"Stable Audio 3 Medium audio outpainting is a 1.4 billion parameter latent diffusion model that extends existing stereo audio beyond its original endpoint via causal continuation guided by text prompts","last_seen_at":"2026-06-03","last_updated":"2026-06-10"},{"id":"fal-ai/stable-audio-3/medium/audio-to-audio","name":"Stable Audio 3 Medium Audio to Audio","created_by":"fal","source":"official","description":"Stable Audio 3 Medium audio-to-audio is a 1.4 billion parameter latent diffusion model that transforms an input audio clip into new stereo variations up to 6 minutes guided by a text prompt.","status":"active","release_date":"2026-05-22","model_type":"other","page_url":"https://fal.run/fal-ai/stable-audio-3/medium/audio-to-audio","tagline":"Stable Audio 3 Medium audio-to-audio is a 1.4 billion parameter latent diffusion model that transforms an input audio clip into new stereo variations up to 6 minutes guided by a text prompt.","last_seen_at":"2026-06-03","last_updated":"2026-06-10"},{"id":"fal-ai/stable-audio-3/medium/base/audio-inpainting","name":"Stable Audio 3 Medium Base Audio Inpainting","created_by":"fal","source":"official","description":"Stable Audio 3 Medium Base audio inpainting is the foundational 1.4 billion parameter checkpoint for editing or filling selected stereo audio segments guided by text 
prompts.","status":"active","release_date":"2026-05-22","model_type":"other","page_url":"https://fal.run/fal-ai/stable-audio-3/medium/base/audio-inpainting","tagline":"Stable Audio 3 Medium Base audio inpainting is the foundational 1.4 billion parameter checkpoint for editing or filling selected stereo audio segments guided by text prompts.","last_seen_at":"2026-06-03","last_updated":"2026-06-10"},{"id":"fal-ai/stable-audio-3/medium/base/audio-outpainting","name":"Stable Audio 3 Medium Base Audio Outpainting","created_by":"fal","source":"official","description":"Stable Audio 3 Medium Base audio outpainting is the foundational 1.4 billion parameter checkpoint that extends existing stereo audio with causal continuation guided by text prompts.","status":"active","release_date":"2026-05-22","model_type":"other","page_url":"https://fal.run/fal-ai/stable-audio-3/medium/base/audio-outpainting","tagline":"Stable Audio 3 Medium Base audio outpainting is the foundational 1.4 billion parameter checkpoint that extends existing stereo audio with causal continuation guided by text prompts.","last_seen_at":"2026-06-03","last_updated":"2026-06-10"},{"id":"fal-ai/stable-audio-3/medium/base/audio-to-audio","name":"Stable Audio 3 Medium Base Audio to Audio","created_by":"fal","source":"official","description":"Stable Audio 3 Medium Base audio-to-audio is the foundational 1.4 billion parameter checkpoint that transforms input audio into new stereo variations up to 6 minutes guided by text prompts.","status":"active","release_date":"2026-05-22","model_type":"other","page_url":"https://fal.run/fal-ai/stable-audio-3/medium/base/audio-to-audio","tagline":"Stable Audio 3 Medium Base audio-to-audio is the foundational 1.4 billion parameter checkpoint that transforms input audio into new stereo variations up to 6 minutes guided by text prompts.","last_seen_at":"2026-06-03","last_updated":"2026-06-10"},{"id":"fal-ai/stable-audio-3/medium/base/text-to-audio","name":"Stable Audio 3 Medium Base 
Text to Audio","created_by":"fal","source":"official","description":"Stable Audio 3 Medium Base is the foundational 1.4 billion parameter text-to-audio checkpoint generating stereo music up to 6 minutes, intended as the unmodified base for custom fine-tuning workflows.","status":"active","release_date":"2026-05-22","model_type":"other","page_url":"https://fal.run/fal-ai/stable-audio-3/medium/base/text-to-audio","tagline":"Stable Audio 3 Medium Base is the foundational 1.4 billion parameter text-to-audio checkpoint generating stereo music up to 6 minutes, intended as the unmodified base for custom fine-tuning workflows.","last_seen_at":"2026-06-03","last_updated":"2026-06-10"},{"id":"fal-ai/stable-audio-3/medium/text-to-audio","name":"Stable Audio 3","created_by":"fal","source":"official","description":"Stable Audio 3 Medium is a 1.4 billion parameter latent diffusion model that generates high-quality stereo music up to 6 minutes from text prompts, trained on fully licensed data for safe commercial u","status":"active","release_date":"2026-05-22","model_type":"other","page_url":"https://fal.run/fal-ai/stable-audio-3/medium/text-to-audio","tagline":"Stable Audio 3 Medium is a 1.4 billion parameter latent diffusion model that generates high-quality stereo music up to 6 minutes from text prompts, trained on fully licensed data for safe commercial u","last_seen_at":"2026-06-03","last_updated":"2026-06-10"},{"id":"fal-ai/stable-audio-3/small/music/audio-inpainting","name":"Stable Audio 3 Small Music Audio Inpainting","created_by":"fal","source":"official","description":"Stable Audio 3 Small Music audio inpainting is a 459 million parameter latent diffusion model that fills in or reworks selected segments of a music track guided by text prompts.","status":"active","release_date":"2026-05-25","model_type":"other","page_url":"https://fal.run/fal-ai/stable-audio-3/small/music/audio-inpainting","tagline":"Stable Audio 3 Small Music audio inpainting is a 459 million parameter 
latent diffusion model that fills in or reworks selected segments of a music track guided by text prompts.","last_seen_at":"2026-06-03","last_updated":"2026-06-10"},{"id":"fal-ai/stable-audio-3/small/music/audio-outpainting","name":"Stable Audio 3 Small Music Audio Outpainting","created_by":"fal","source":"official","description":"Stable Audio 3 Small Music audio outpainting is a 459 million parameter latent diffusion model that extends music compositions beyond their original endpoint via causal continuation.","status":"active","release_date":"2026-05-25","model_type":"other","page_url":"https://fal.run/fal-ai/stable-audio-3/small/music/audio-outpainting","tagline":"Stable Audio 3 Small Music audio outpainting is a 459 million parameter latent diffusion model that extends music compositions beyond their original endpoint via causal continuation.","last_seen_at":"2026-06-03","last_updated":"2026-06-10"},{"id":"fal-ai/stable-audio-3/small/music/audio-to-audio","name":"Stable Audio 3","created_by":"fal","source":"official","description":"Stable Audio 3 Small Music audio-to-audio is a 459 million parameter latent diffusion model that transforms input music into new variations up to 2 minutes guided by text prompts.","status":"active","release_date":"2026-05-22","model_type":"other","page_url":"https://fal.run/fal-ai/stable-audio-3/small/music/audio-to-audio","tagline":"Stable Audio 3 Small Music audio-to-audio is a 459 million parameter latent diffusion model that transforms input music into new variations up to 2 minutes guided by text prompts.","last_seen_at":"2026-06-03","last_updated":"2026-06-10"},{"id":"fal-ai/stable-audio-3/small/music/base/audio-inpainting","name":"Stable Audio 3 Small Music Base Audio Inpainting","created_by":"fal","source":"official","description":"Stable Audio 3 Small Music Base audio inpainting is the foundational 459 million parameter checkpoint for editing or filling selected music segments guided by text 
prompts.","status":"active","release_date":"2026-05-25","model_type":"other","page_url":"https://fal.run/fal-ai/stable-audio-3/small/music/base/audio-inpainting","tagline":"Stable Audio 3 Small Music Base audio inpainting is the foundational 459 million parameter checkpoint for editing or filling selected music segments guided by text prompts.","last_seen_at":"2026-06-03","last_updated":"2026-06-10"},{"id":"fal-ai/stable-audio-3/small/music/base/audio-outpainting","name":"Stable Audio 3 Small Music Base Audio Outpainting","created_by":"fal","source":"official","description":"Stable Audio 3 Small Music Base audio outpainting is the foundational 459 million parameter checkpoint that extends music tracks via causal continuation guided by text prompts.","status":"active","release_date":"2026-05-25","model_type":"other","page_url":"https://fal.run/fal-ai/stable-audio-3/small/music/base/audio-outpainting","tagline":"Stable Audio 3 Small Music Base audio outpainting is the foundational 459 million parameter checkpoint that extends music tracks via causal continuation guided by text prompts.","last_seen_at":"2026-06-03","last_updated":"2026-06-10"},{"id":"fal-ai/stable-audio-3/small/music/base/audio-to-audio","name":"Stable Audio 3 Small Music Base Audio to Audio","created_by":"fal","source":"official","description":"Stable Audio 3 Small Music Base audio-to-audio is the foundational 459 million parameter checkpoint that transforms input music into new variations up to 2 minutes guided by text prompts.","status":"active","release_date":"2026-05-25","model_type":"other","page_url":"https://fal.run/fal-ai/stable-audio-3/small/music/base/audio-to-audio","tagline":"Stable Audio 3 Small Music Base audio-to-audio is the foundational 459 million parameter checkpoint that transforms input music into new variations up to 2 minutes guided by text 
prompts.","last_seen_at":"2026-06-03","last_updated":"2026-06-10"},{"id":"fal-ai/stable-audio-3/small/music/base/text-to-audio","name":"Stable Audio 3","created_by":"fal","source":"official","description":"Stable Audio 3 Small Music Base is the foundational 459 million parameter checkpoint generating full music compositions up to 2 minutes from text prompts, intended as the unmodified base for fine-tuni","status":"active","release_date":"2026-05-22","model_type":"other","page_url":"https://fal.run/fal-ai/stable-audio-3/small/music/base/text-to-audio","tagline":"Stable Audio 3 Small Music Base is the foundational 459 million parameter checkpoint generating full music compositions up to 2 minutes from text prompts, intended as the unmodified base for fine-tuni","last_seen_at":"2026-06-03","last_updated":"2026-06-10"},{"id":"fal-ai/stable-audio-3/small/music/text-to-audio","name":"Stable Audio 3 Small Music Text to Audio","created_by":"fal","source":"official","description":"Stable Audio 3 Small Music is a 459 million parameter latent diffusion model that generates full stereo music compositions up to 2 minutes from text prompts, lightweight enough for on-device deploymen","status":"active","release_date":"2026-05-22","model_type":"other","page_url":"https://fal.run/fal-ai/stable-audio-3/small/music/text-to-audio","tagline":"Stable Audio 3 Small Music is a 459 million parameter latent diffusion model that generates full stereo music compositions up to 2 minutes from text prompts, lightweight enough for on-device deploymen","last_seen_at":"2026-06-03","last_updated":"2026-06-10"},{"id":"fal-ai/stable-audio-3/small/sfx/audio-inpainting","name":"Stable Audio 3 Small SFX Audio Inpainting","created_by":"fal","source":"official","description":"Stable Audio 3 Small SFX audio inpainting is a 459 million parameter latent diffusion model that fills in or reworks selected segments of a sound-effect track guided by text 
prompts.","status":"active","release_date":"2026-05-25","model_type":"other","page_url":"https://fal.run/fal-ai/stable-audio-3/small/sfx/audio-inpainting","tagline":"Stable Audio 3 Small SFX audio inpainting is a 459 million parameter latent diffusion model that fills in or reworks selected segments of a sound-effect track guided by text prompts.","last_seen_at":"2026-06-03","last_updated":"2026-06-10"},{"id":"fal-ai/stable-audio-3/small/sfx/audio-outpainting","name":"Stable Audio 3 Small SFX Audio Outpainting","created_by":"fal","source":"official","description":"Stable Audio 3 Small SFX audio outpainting is a 459 million parameter latent diffusion model that extends sound-effect tracks beyond their original endpoint via causal continuation.","status":"active","release_date":"2026-05-25","model_type":"other","page_url":"https://fal.run/fal-ai/stable-audio-3/small/sfx/audio-outpainting","tagline":"Stable Audio 3 Small SFX audio outpainting is a 459 million parameter latent diffusion model that extends sound-effect tracks beyond their original endpoint via causal continuation.","last_seen_at":"2026-06-03","last_updated":"2026-06-10"},{"id":"fal-ai/stable-audio-3/small/sfx/audio-to-audio","name":"Stable Audio 3","created_by":"fal","source":"official","description":"Stable Audio 3 Small SFX audio-to-audio is a 459 million parameter latent diffusion model that transforms input audio into new sound-effect variations guided by text prompts.","status":"active","release_date":"2026-05-25","model_type":"other","page_url":"https://fal.run/fal-ai/stable-audio-3/small/sfx/audio-to-audio","tagline":"Stable Audio 3 Small SFX audio-to-audio is a 459 million parameter latent diffusion model that transforms input audio into new sound-effect variations guided by text prompts.","last_seen_at":"2026-06-03","last_updated":"2026-06-10"},{"id":"fal-ai/stable-audio-3/small/sfx/base/audio-inpainting","name":"Stable Audio 3 Small SFX Base Audio 
Inpainting","created_by":"fal","source":"official","description":"Stable Audio 3 Small SFX Base audio inpainting is the foundational 459 million parameter checkpoint for editing or filling selected sound-effect segments guided by text prompts.","status":"active","release_date":"2026-05-25","model_type":"other","page_url":"https://fal.run/fal-ai/stable-audio-3/small/sfx/base/audio-inpainting","tagline":"Stable Audio 3 Small SFX Base audio inpainting is the foundational 459 million parameter checkpoint for editing or filling selected sound-effect segments guided by text prompts.","last_seen_at":"2026-06-03","last_updated":"2026-06-10"},{"id":"fal-ai/stable-audio-3/small/sfx/base/audio-outpainting","name":"Stable Audio 3 Small SFX Base Audio Outpainting","created_by":"fal","source":"official","description":"Stable Audio 3 Small SFX Base audio outpainting is the foundational 459 million parameter checkpoint that extends sound-effect tracks via causal continuation guided by text prompts.","status":"active","release_date":"2026-05-25","model_type":"other","page_url":"https://fal.run/fal-ai/stable-audio-3/small/sfx/base/audio-outpainting","tagline":"Stable Audio 3 Small SFX Base audio outpainting is the foundational 459 million parameter checkpoint that extends sound-effect tracks via causal continuation guided by text prompts.","last_seen_at":"2026-06-03","last_updated":"2026-06-10"},{"id":"fal-ai/stable-audio-3/small/sfx/base/audio-to-audio","name":"Stable Audio 3 Small SFX Base Audio to Audio","created_by":"fal","source":"official","description":"Stable Audio 3 Small SFX Base audio-to-audio is the foundational 459 million parameter checkpoint that transforms input audio into new sound-effect variations guided by text prompts.","status":"active","release_date":"2026-05-25","model_type":"other","page_url":"https://fal.run/fal-ai/stable-audio-3/small/sfx/base/audio-to-audio","tagline":"Stable Audio 3 Small SFX Base audio-to-audio is the foundational 459 million parameter 
checkpoint that transforms input audio into new sound-effect variations guided by text prompts.","last_seen_at":"2026-06-03","last_updated":"2026-06-10"},{"id":"fal-ai/stable-audio-3/small/sfx/base/text-to-audio","name":"Stable Audio 3 Small SFX Base Text to Audio","created_by":"fal","source":"official","description":"Stable Audio 3 Small SFX Base is the foundational 459 million parameter checkpoint generating sound effects from text prompts, intended as the unmodified base for fine-tuning.","status":"active","release_date":"2026-05-25","model_type":"other","page_url":"https://fal.run/fal-ai/stable-audio-3/small/sfx/base/text-to-audio","tagline":"Stable Audio 3 Small SFX Base is the foundational 459 million parameter checkpoint generating sound effects from text prompts, intended as the unmodified base for fine-tuning.","last_seen_at":"2026-06-03","last_updated":"2026-06-10"},{"id":"fal-ai/stable-audio-3/small/sfx/text-to-audio","name":"Stable Audio 3 Small SFX Text to Audio","created_by":"fal","source":"official","description":"Stable Audio 3 Small SFX is a 459 million parameter latent diffusion model that generates high-quality sound effects from text prompts, designed for on-device deployment on mobile phones and consumer ","status":"active","release_date":"2026-05-25","model_type":"other","page_url":"https://fal.run/fal-ai/stable-audio-3/small/sfx/text-to-audio","tagline":"Stable Audio 3 Small SFX is a 459 million parameter latent diffusion model that generates high-quality sound effects from text prompts, designed for on-device deployment on mobile phones and consumer ","last_seen_at":"2026-06-03","last_updated":"2026-06-10"},{"id":"fal-ai/stable-audio-3-trainer","name":"Stable Audio 3 Trainer","created_by":"fal","source":"official","description":"Stable Audio 3 LoRA Trainer fine-tunes Stable Audio 3 base models on paired audio-caption datasets, producing compact LoRA weights that adapt generation toward a custom music style, sound palette, or 
","status":"active","release_date":"2026-06-11","model_type":"other","page_url":"https://fal.run/fal-ai/stable-audio-3-trainer","tagline":"Stable Audio 3 LoRA Trainer fine-tunes Stable Audio 3 base models on paired audio-caption datasets, producing compact LoRA weights that adapt generation toward a custom music style, sound palette, or ","last_seen_at":"2026-06-14","last_updated":"2026-06-18"},{"id":"fal-ai/stable-audio","name":"Stable Audio Open","created_by":"fal","source":"official","description":"Open source text-to-audio model.","status":"active","release_date":"2024-01-04","model_type":"other","page_url":"https://fal.run/fal-ai/stable-audio","tagline":"Open source text-to-audio model.","last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/stable-avatar","name":"Stable Avatar","created_by":"fal","source":"official","description":"Stable Avatar generates audio-driven video avatars up to five minutes long","status":"active","release_date":"2025-08-14","model_type":"other","page_url":"https://fal.run/fal-ai/stable-avatar","tagline":"Stable Avatar generates audio-driven video avatars up to five minutes long","last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/stable-cascade/sote-diffusion","name":"SoteDiffusion","created_by":"fal","source":"official","description":"Anime finetune of Würstchen V3.","status":"active","release_date":"2024-06-10","model_type":"image","page_url":"https://fal.run/fal-ai/stable-cascade/sote-diffusion","tagline":"Anime finetune of Würstchen V3.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/stable-cascade","name":"Stable Cascade","created_by":"fal","source":"official","description":"Stable Cascade: Image generation on a smaller & cheaper latent 
space.","status":"active","release_date":"2024-06-25","model_type":"image","page_url":"https://fal.run/fal-ai/stable-cascade","tagline":"Stable Cascade: Image generation on a smaller & cheaper latent space.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/stable-diffusion-v15","name":"Stable Diffusion v1.5","created_by":"fal","source":"official","description":"Stable Diffusion v1.5","status":"active","release_date":"2024-04-16","model_type":"image","page_url":"https://fal.run/fal-ai/stable-diffusion-v15","tagline":"Stable Diffusion v1.5","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/stable-diffusion-v3-medium/image-to-image","name":"Stable Diffusion V3","created_by":"fal","source":"official","description":"Stable Diffusion 3 Medium (Image to Image) is a Multimodal Diffusion Transformer (MMDiT) model that improves image quality, typography, prompt understanding, and efficiency.","status":"active","release_date":"2024-06-12","model_type":"image","page_url":"https://fal.run/fal-ai/stable-diffusion-v3-medium/image-to-image","tagline":"Stable Diffusion 3 Medium (Image to Image) is a Multimodal Diffusion Transformer (MMDiT) model that improves image quality, typography, prompt understanding, and efficiency.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/stable-diffusion-v3-medium","name":"Stable Diffusion V3","created_by":"fal","source":"official","description":"Stable Diffusion 3 Medium (Text to Image) is a Multimodal Diffusion Transformer (MMDiT) model that improves image quality, typography, prompt understanding, and 
efficiency.","status":"active","release_date":"2024-08-20","model_type":"image","page_url":"https://fal.run/fal-ai/stable-diffusion-v3-medium","tagline":"Stable Diffusion 3 Medium (Text to Image) is a Multimodal Diffusion Transformer (MMDiT) model that improves image quality, typography, prompt understanding, and efficiency.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/stable-diffusion-v35-large","name":"Stable Diffusion 3.5 Large","created_by":"fal","source":"official","description":"Stable Diffusion 3.5 Large is a Multimodal Diffusion Transformer (MMDiT) text-to-image model that features improved performance in image quality, typography, complex prompt understanding, and resource","status":"active","release_date":"2024-10-27","model_type":"image","page_url":"https://fal.run/fal-ai/stable-diffusion-v35-large","tagline":"Stable Diffusion 3.5 Large is a Multimodal Diffusion Transformer (MMDiT) text-to-image model that features improved performance in image quality, typography, complex prompt understanding, and resource","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/stable-diffusion-v35-medium","name":"Stable Diffusion 3.5 Medium","created_by":"fal","source":"official","description":"Stable Diffusion 3.5 Medium is a Multimodal Diffusion Transformer (MMDiT) text-to-image model that features improved performance in image quality, typography, complex prompt understanding, and resourc","status":"active","release_date":"2024-10-27","model_type":"image","page_url":"https://fal.run/fal-ai/stable-diffusion-v35-medium","tagline":"Stable Diffusion 3.5 Medium is a Multimodal Diffusion Transformer (MMDiT) text-to-image model that features improved performance in image quality, typography, complex prompt understanding, and 
resourc","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/stable-video","name":"High Quality Stable Video Diffusion","created_by":"fal","source":"official","description":"Generate short video clips from your images using SVD v1.1","status":"active","release_date":"2024-09-16","model_type":"video","page_url":"https://fal.run/fal-ai/stable-video","tagline":"Generate short video clips from your images using SVD v1.1","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/star-vector","name":"StarVector","created_by":"fal","source":"official","description":"AI vectorization model that transforms raster images into scalable SVG graphics, preserving visual details while enabling infinite scaling and easy editing capabilities.","status":"active","release_date":"2025-04-01","model_type":"image","page_url":"https://fal.run/fal-ai/star-vector","tagline":"AI vectorization model that transforms raster images into scalable SVG graphics, preserving visual details while enabling infinite scaling and easy editing capabilities.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/step1x-edit","name":"Step1X Edit","created_by":"fal","source":"official","description":"Step1X-Edit transforms your photos with simple instructions into stunning, professional-quality edits—rivaling top proprietary tools.","status":"active","release_date":"2025-04-25","model_type":"image","page_url":"https://fal.run/fal-ai/step1x-edit","tagline":"Step1X-Edit transforms your photos with simple instructions into stunning, professional-quality edits—rivaling top proprietary 
tools.","capabilities":{"vision":true,"tool_call":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"tools":["function_calling"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/stepx-edit2","name":"Stepx Edit2","created_by":"fal","source":"official","description":"Image-to-image editing with Step1X-Edit v2 from StepFun.","status":"active","release_date":"2025-12-09","model_type":"image","page_url":"https://fal.run/fal-ai/stepx-edit2","tagline":"Image-to-image editing with Step1X-Edit v2 from StepFun.","capabilities":{"vision":true,"reasoning":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/swin2sr","name":"SWIN2SR","created_by":"fal","source":"official","description":"Enhance low-resolution images with the superior quality of Swin2SR for sharper, clearer results.","status":"active","release_date":"2025-02-28","model_type":"image","page_url":"https://fal.run/fal-ai/swin2sr","tagline":"Enhance low-resolution images with the superior quality of Swin2SR for sharper, clearer results.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/switti/512","name":"Switti 512","created_by":"fal","source":"official","description":"Switti is a scale-wise transformer for fast text-to-image generation that outperforms existing T2I AR models and competes with state-of-the-art T2I diffusion models while being faster than distilled d","status":"active","release_date":"2024-12-31","model_type":"image","page_url":"https://fal.run/fal-ai/switti/512","tagline":"Switti is a scale-wise transformer for fast text-to-image generation that outperforms existing T2I AR models and competes with state-of-the-art T2I diffusion models while being faster than distilled 
d","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/switti","name":"Switti 1024","created_by":"fal","source":"official","description":"Switti is a scale-wise transformer for fast text-to-image generation that outperforms existing T2I AR models and competes with state-of-the-art T2I diffusion models while being faster than distilled d","status":"active","release_date":"2024-12-31","model_type":"image","page_url":"https://fal.run/fal-ai/switti","tagline":"Switti is a scale-wise transformer for fast text-to-image generation that outperforms existing T2I AR models and competes with state-of-the-art T2I diffusion models while being faster than distilled d","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/sync-lipsync/react-1","name":"Sync React-1","created_by":"fal","source":"official","description":"Use React-1 from SyncLabs to refine human emotions and do realistic lip-sync without losing details!","status":"active","release_date":"2025-12-10","model_type":"other","page_url":"https://fal.run/fal-ai/sync-lipsync/react-1","tagline":"Use React-1 from SyncLabs to refine human emotions and do realistic lip-sync without losing details!","last_seen_at":"2026-04-30","last_updated":"2026-05-11"},{"id":"fal-ai/sync-lipsync/v2/pro","name":"Sync Lipsync","created_by":"fal","source":"official","description":"Generate high-quality realistic lipsync animations from audio while preserving unique details like natural teeth and unique facial features using the state-of-the-art Sync Lipsync 2 Pro model.","status":"active","release_date":"2025-09-02","model_type":"other","page_url":"https://fal.run/fal-ai/sync-lipsync/v2/pro","tagline":"Generate high-quality realistic lipsync animations from audio while preserving unique details like 
natural teeth and unique facial features using the state-of-the-art Sync Lipsync 2 Pro model.","last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/sync-lipsync/v2","name":"Sync Lipsync 2.0","created_by":"fal","source":"official","description":"Generate realistic lipsync animations from audio using advanced algorithms for high-quality synchronization with Sync Lipsync 2.0 model","status":"active","release_date":"2025-04-01","model_type":"other","page_url":"https://fal.run/fal-ai/sync-lipsync/v2","tagline":"Generate realistic lipsync animations from audio using advanced algorithms for high-quality synchronization with Sync Lipsync 2.0 model","last_seen_at":"2026-06-26","last_updated":"2026-06-29"},{"id":"fal-ai/sync-lipsync/v3/image-to-video","name":"sync-3 Avatar Image to Video","created_by":"fal","source":"official","description":"sync-3 image to video turns a single still into a talking character, and works with any illustration or animated frame paired with a voice track","status":"active","release_date":"2026-06-22","model_type":"video","page_url":"https://fal.run/fal-ai/sync-lipsync/v3/image-to-video","tagline":"sync-3 image to video turns a single still into a talking character, and works with any illustration or animated frame paired with a voice track","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-23","last_updated":"2026-06-29"},{"id":"fal-ai/sync-lipsync/v3","name":"sync-3 Lipsync","created_by":"fal","source":"official","description":"sync-3 most powerful lipsync model yet, featuring native visual intelligence for professional-quality video.","status":"active","release_date":"2026-04-06","model_type":"other","page_url":"https://fal.run/fal-ai/sync-lipsync/v3","tagline":"sync-3 most powerful lipsync model yet, featuring native visual intelligence for professional-quality 
video.","last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/sync-lipsync","name":"sync.so -- lipsync 1.9.0-beta","created_by":"fal","source":"official","description":"Generate realistic lipsync animations from audio using advanced algorithms for high-quality synchronization.","status":"active","release_date":"2025-01-13","model_type":"other","page_url":"https://fal.run/fal-ai/sync-lipsync","tagline":"Generate realistic lipsync animations from audio using advanced algorithms for high-quality synchronization.","last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/t2v-turbo","name":"T2V Turbo - Video Crafter","created_by":"fal","source":"official","description":"Generate short video clips from your prompts","status":"active","release_date":"2024-03-08","model_type":"video","page_url":"https://fal.run/fal-ai/t2v-turbo","tagline":"Generate short video clips from your prompts","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/tada/1b/text-to-speech","name":"Tada TTS 1B","created_by":"fal","source":"official","description":"A unified speech-language model that synchronizes speech and text into a single, cohesive stream via 1:1 alignment.","status":"active","release_date":"2026-03-12","model_type":"other","page_url":"https://fal.run/fal-ai/tada/1b/text-to-speech","tagline":"A unified speech-language model that synchronizes speech and text into a single, cohesive stream via 1:1 alignment.","last_seen_at":"2026-03-12","last_updated":"2026-05-11"},{"id":"fal-ai/tada/3b/text-to-speech","name":"Tada","created_by":"fal","source":"official","description":"A unified speech-language model that synchronizes speech and text into a single, cohesive stream via 1:1 alignment.","status":"active","release_date":"2026-03-12","model_type":"other","page_url":"https://fal.run/fal-ai/tada/3b/text-to-speech","tagline":"A unified speech-language model that 
synchronizes speech and text into a single, cohesive stream via 1:1 alignment.","last_seen_at":"2026-03-12","last_updated":"2026-05-11"},{"id":"fal-ai/telestyle-v2","name":"Telestyle V2 Style Transfer","created_by":"fal","source":"official","description":"Restyle any image with TeleStyle v2 — provide an original image and a styling reference, and the model re-renders the original in the reference's visual style while preserving its content and composit","status":"active","release_date":"2026-06-22","model_type":"image","page_url":"https://fal.run/fal-ai/telestyle-v2","tagline":"Restyle any image with TeleStyle v2 — provide an original image and a styling reference, and the model re-renders the original in the reference's visual style while preserving its content and composit","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-22","last_updated":"2026-06-29"},{"id":"fal-ai/thera","name":"Thera","created_by":"fal","source":"official","description":"Fix low resolution images with fast speed and quality of thera.","status":"active","release_date":"2025-03-24","model_type":"image","page_url":"https://fal.run/fal-ai/thera","tagline":"Fix low resolution images with fast speed and quality of thera.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/thinksound/audio","name":"ThinkSound","created_by":"fal","source":"official","description":"Generate realistic audio from a video with an optional text prompt","status":"active","release_date":"2025-07-02","model_type":"other","page_url":"https://fal.run/fal-ai/thinksound/audio","tagline":"Generate realistic audio from a video with an optional text 
prompt","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/thinksound","name":"ThinkSound","created_by":"fal","source":"official","description":"Generate realistic audio for a video with an optional text prompt and combine","status":"active","release_date":"2025-07-01","model_type":"other","page_url":"https://fal.run/fal-ai/thinksound","tagline":"Generate realistic audio for a video with an optional text prompt and combine","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/topaz/upscale/image","name":"Topaz","created_by":"fal","source":"official","description":"Use the powerful and accurate topaz image enhancer to enhance your images.","status":"active","release_date":"2025-06-27","model_type":"image","page_url":"https://fal.run/fal-ai/topaz/upscale/image","tagline":"Use the powerful and accurate topaz image enhancer to enhance your images.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-05-26","last_updated":"2026-06-03"},{"id":"fal-ai/topaz/upscale/video","name":"Topaz Video Upscale","created_by":"fal","source":"official","description":"Professional-grade video upscaling using Topaz technology.","status":"active","release_date":"2025-03-04","model_type":"other","page_url":"https://fal.run/fal-ai/topaz/upscale/video","tagline":"Professional-grade video upscaling using Topaz technology.","last_seen_at":"2026-06-29","last_updated":"2026-06-30"},{"id":"fal-ai/transpixar","name":"TransPixar V1","created_by":"fal","source":"official","description":"Transform text into stunning videos with TransPixar - an AI model that generates both RGB footage and alpha channels, enabling seamless compositing and creative video effects.","status":"active","release_date":"2025-01-14","model_type":"video","page_url":"https://fal.run/fal-ai/transpixar","tagline":"Transform text into stunning videos with TransPixar - an AI model that generates both RGB footage 
and alpha channels, enabling seamless compositing and creative video effects.","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/trellis-2/retexture","name":"Trellis 2","created_by":"fal","source":"official","description":"Generate 3D models from your images using Trellis 2.","status":"active","release_date":"2026-03-02","model_type":"other","page_url":"https://fal.run/fal-ai/trellis-2/retexture","tagline":"Generate 3D models from your images using Trellis 2.","capabilities":{"vision":true},"last_seen_at":"2026-03-02","last_updated":"2026-05-11"},{"id":"fal-ai/trellis-2","name":"Trellis 2","created_by":"fal","source":"official","description":"Generate 3D models from your images using Trellis 2.","status":"active","release_date":"2025-12-17","model_type":"other","page_url":"https://fal.run/fal-ai/trellis-2","tagline":"Generate 3D models from your images using Trellis 2.","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/trellis/multi","name":"Trellis","created_by":"fal","source":"official","description":"Generate 3D models from multiple images using Trellis.","status":"active","release_date":"2025-05-02","model_type":"other","page_url":"https://fal.run/fal-ai/trellis/multi","tagline":"Generate 3D models from multiple images using Trellis.","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/trellis","name":"Trellis","created_by":"fal","source":"official","description":"Generate 3D models from your images using Trellis.","status":"active","release_date":"2024-12-13","model_type":"other","page_url":"https://fal.run/fal-ai/trellis","tagline":"Generate 3D models from your images using 
Trellis.","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/triposr","name":"TripoSR","created_by":"fal","source":"official","description":"State of the art Image to 3D Object generation","status":"active","release_date":"2024-01-30","model_type":"other","page_url":"https://fal.run/fal-ai/triposr","tagline":"State of the art Image to 3D Object generation","capabilities":{"vision":true},"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/turbo-flux-trainer","name":"Turbo Flux Trainer","created_by":"fal","source":"official","description":"A blazing fast FLUX dev LoRA trainer for subjects and styles.","status":"active","release_date":"2025-04-17","model_type":"other","page_url":"https://fal.run/fal-ai/turbo-flux-trainer","tagline":"A blazing fast FLUX dev LoRA trainer for subjects and styles.","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/ultrashape","name":"Ultrashape","created_by":"fal","source":"official","description":"UltraShape-1.0 is a 3D diffusion framework that generates high-fidelity 3D geometry through coarse-to-fine geometric refinement.","status":"active","release_date":"2026-01-06","model_type":"other","page_url":"https://fal.run/fal-ai/ultrashape","tagline":"UltraShape-1.0 is a 3D diffusion framework that generates high-fidelity 3D geometry through coarse-to-fine geometric refinement.","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/uno","name":"Uno","created_by":"fal","source":"official","description":"An AI model that transforms input images into new ones based on text prompts, blending reference visuals with your creative directions.","status":"active","release_date":"2025-04-24","model_type":"image","page_url":"https://fal.run/fal-ai/uno","tagline":"An AI model that transforms input images into new ones based on text prompts, blending reference visuals with your creative 
directions.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/uso","name":"Uso","created_by":"fal","source":"official","description":"Use USO to perform subject driven generations using reference image.","status":"active","release_date":"2025-08-30","model_type":"image","page_url":"https://fal.run/fal-ai/uso","tagline":"Use USO to perform subject driven generations using reference image.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/vecglypher/image-to-svg","name":"Vecglypher","created_by":"fal","source":"official","description":"Vector font generation with VecGlypher.","status":"active","release_date":"2026-03-10","model_type":"image","page_url":"https://fal.run/fal-ai/vecglypher/image-to-svg","tagline":"Vector font generation with VecGlypher.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-03-10","last_updated":"2026-05-11"},{"id":"fal-ai/vecglypher","name":"Vecglypher","created_by":"fal","source":"official","description":"Vector font generation with VecGlypher.","status":"active","release_date":"2026-03-10","model_type":"image","page_url":"https://fal.run/fal-ai/vecglypher","tagline":"Vector font generation with VecGlypher.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-03-10","last_updated":"2026-05-11"},{"id":"fal-ai/veo2/image-to-video","name":"Veo 2 (Image to Video)","created_by":"fal","source":"official","description":"Veo 2 creates videos from images with realistic motion and very high quality 
output.","status":"active","release_date":"2025-03-11","model_type":"video","page_url":"https://fal.run/fal-ai/veo2/image-to-video","tagline":"Veo 2 creates videos from images with realistic motion and very high quality output.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-28","last_updated":"2026-05-11"},{"id":"fal-ai/veo2","name":"Veo 2","created_by":"fal","source":"official","description":"Veo 2 creates videos with realistic motion and high quality output.","status":"active","release_date":"2025-02-21","model_type":"video","page_url":"https://fal.run/fal-ai/veo2","tagline":"Veo 2 creates videos with realistic motion and high quality output.","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-28","last_updated":"2026-05-11"},{"id":"fal-ai/veo3/fast/image-to-video","name":"Veo 3 Fast [Image to Video]","created_by":"fal","source":"official","description":"Now with a 50% price drop.","status":"active","release_date":"2025-07-09","model_type":"video","page_url":"https://fal.run/fal-ai/veo3/fast/image-to-video","tagline":"Now with a 50% price drop.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-28","last_updated":"2026-05-11"},{"id":"fal-ai/veo3/fast","name":"Veo 3 Fast","created_by":"fal","source":"official","description":"Faster and more cost effective version of Google's Veo 3! ","status":"active","release_date":"2025-07-09","model_type":"video","page_url":"https://fal.run/fal-ai/veo3/fast","tagline":"Faster and more cost effective version of Google's Veo 3! 
","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-28","last_updated":"2026-05-11"},{"id":"fal-ai/veo3/image-to-video","name":"Veo3","created_by":"fal","source":"official","description":"Veo 3 is the latest state-of-the art video generation model from Google DeepMind","status":"active","release_date":"2025-08-01","model_type":"video","page_url":"https://fal.run/fal-ai/veo3/image-to-video","tagline":"Veo 3 is the latest state-of-the art video generation model from Google DeepMind","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-28","last_updated":"2026-05-11"},{"id":"fal-ai/veo3.1/extend-video","name":"Veo 3.1","created_by":"fal","source":"official","description":"Extend Veo-Created Videos up to 30 seconds","status":"active","release_date":"2025-12-15","model_type":"other","page_url":"https://fal.run/fal-ai/veo3.1/extend-video","tagline":"Extend Veo-Created Videos up to 30 seconds","last_seen_at":"2026-04-28","last_updated":"2026-05-11"},{"id":"fal-ai/veo3.1/fast/extend-video","name":"Veo 3.1 Fast","created_by":"fal","source":"official","description":"Extend Veo-Created Videos up to 30 seconds","status":"active","release_date":"2025-12-15","model_type":"other","page_url":"https://fal.run/fal-ai/veo3.1/fast/extend-video","tagline":"Extend Veo-Created Videos up to 30 seconds","last_seen_at":"2026-04-28","last_updated":"2026-05-11"},{"id":"fal-ai/veo3.1/fast/first-last-frame-to-video","name":"Veo 3.1 Fast","created_by":"fal","source":"official","description":"Generate videos from a first/last frame using Google's Veo 3.1 Fast","status":"active","release_date":"2025-10-08","model_type":"video","page_url":"https://fal.run/fal-ai/veo3.1/fast/first-last-frame-to-video","tagline":"Generate videos from a first/last frame using Google's Veo 3.1 
Fast","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-28","last_updated":"2026-05-11"},{"id":"fal-ai/veo3.1/fast/image-to-video","name":"Veo 3.1 Fast","created_by":"fal","source":"official","description":"Generate videos from your image prompts using Veo 3.1 fast.","status":"active","release_date":"2025-10-08","model_type":"video","page_url":"https://fal.run/fal-ai/veo3.1/fast/image-to-video","tagline":"Generate videos from your image prompts using Veo 3.1 fast.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-28","last_updated":"2026-05-11"},{"id":"fal-ai/veo3.1/fast/reference-to-video","name":"Veo 3.1 Fast","created_by":"fal","source":"official","description":"Generate videos from reference images using Google's Veo 3.1 Fast","status":"active","release_date":"2025-10-08","model_type":"video","page_url":"https://fal.run/fal-ai/veo3.1/fast/reference-to-video","tagline":"Generate videos from reference images using Google's Veo 3.1 Fast","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-05-11","last_updated":"2026-06-03"},{"id":"fal-ai/veo3.1/fast","name":"Veo 3.1 Fast","created_by":"fal","source":"official","description":"Faster and more cost effective version of Google's Veo 3.1! ","status":"active","release_date":"2025-10-08","model_type":"video","page_url":"https://fal.run/fal-ai/veo3.1/fast","tagline":"Faster and more cost effective version of Google's Veo 3.1! 
","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-28","last_updated":"2026-05-11"},{"id":"fal-ai/veo3.1/first-last-frame-to-video","name":"Veo 3.1","created_by":"fal","source":"official","description":"Generate videos from a first and last framed using Google's Veo 3.1","status":"active","release_date":"2025-10-08","model_type":"video","page_url":"https://fal.run/fal-ai/veo3.1/first-last-frame-to-video","tagline":"Generate videos from a first and last framed using Google's Veo 3.1","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-28","last_updated":"2026-05-11"},{"id":"fal-ai/veo3.1/image-to-video","name":"Veo 3.1","created_by":"fal","source":"official","description":"Veo 3.1 is the latest state-of-the art video generation model from Google DeepMind","status":"active","release_date":"2025-10-08","model_type":"video","page_url":"https://fal.run/fal-ai/veo3.1/image-to-video","tagline":"Veo 3.1 is the latest state-of-the art video generation model from Google DeepMind","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-28","last_updated":"2026-05-11"},{"id":"fal-ai/veo3.1/lite/first-last-frame-to-video","name":"Veo3.1 Lite FLF","created_by":"fal","source":"official","description":"Veo 3.1 Lite balances practical utility with professional capabilities, supporting Text-to-Video and Image-to-Video","status":"active","release_date":"2026-03-31","model_type":"video","page_url":"https://fal.run/fal-ai/veo3.1/lite/first-last-frame-to-video","tagline":"Veo 3.1 Lite balances practical utility with professional capabilities, supporting Text-to-Video and 
Image-to-Video","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-28","last_updated":"2026-05-11"},{"id":"fal-ai/veo3.1/lite/image-to-video","name":"Veo3.1 Lite Image to Video","created_by":"fal","source":"official","description":"Veo 3.1 Lite balances practical utility with professional capabilities, supporting Text-to-Video and Image-to-Video","status":"active","release_date":"2026-03-31","model_type":"video","page_url":"https://fal.run/fal-ai/veo3.1/lite/image-to-video","tagline":"Veo 3.1 Lite balances practical utility with professional capabilities, supporting Text-to-Video and Image-to-Video","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-28","last_updated":"2026-05-11"},{"id":"fal-ai/veo3.1/lite","name":"Veo3.1 Lite Text to Video","created_by":"fal","source":"official","description":"Veo 3.1 Lite balances practical utility with professional capabilities, supporting Text-to-Video and Image-to-Video","status":"active","release_date":"2026-03-31","model_type":"video","page_url":"https://fal.run/fal-ai/veo3.1/lite","tagline":"Veo 3.1 Lite balances practical utility with professional capabilities, supporting Text-to-Video and Image-to-Video","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-28","last_updated":"2026-05-11"},{"id":"fal-ai/veo3.1/reference-to-video","name":"Veo 3.1","created_by":"fal","source":"official","description":"Generate Videos from images using Google's Veo 3.1","status":"active","release_date":"2025-10-08","model_type":"video","page_url":"https://fal.run/fal-ai/veo3.1/reference-to-video","tagline":"Generate Videos from images using Google's Veo 
3.1","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-28","last_updated":"2026-05-11"},{"id":"fal-ai/veo3.1","name":"Veo 3.1","created_by":"fal","source":"official","description":"Veo 3.1 by Google, the most advanced AI video generation model in the world.","status":"active","release_date":"2025-10-08","model_type":"video","page_url":"https://fal.run/fal-ai/veo3.1","tagline":"Veo 3.1 by Google, the most advanced AI video generation model in the world.","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-28","last_updated":"2026-05-11"},{"id":"fal-ai/veo3","name":"Veo 3","created_by":"fal","source":"official","description":"Veo 3 by Google, the most advanced AI video generation model in the world.","status":"active","release_date":"2025-06-05","model_type":"video","page_url":"https://fal.run/fal-ai/veo3","tagline":"Veo 3 by Google, the most advanced AI video generation model in the world.","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-28","last_updated":"2026-05-11"},{"id":"fal-ai/vibevoice/0.5b","name":"Vibevoice","created_by":"fal","source":"official","description":"Generate long speech snippets fast using Microsoft's powerful TTS.","status":"active","release_date":"2025-12-17","model_type":"tts","page_url":"https://fal.run/fal-ai/vibevoice/0.5b","tagline":"Generate long speech snippets fast using Microsoft's powerful TTS.","modalities":{"input":["text"],"output":["audio"]},"endpoints":["audio_speech"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/vibevoice/7b","name":"VibeVoice 7B","created_by":"fal","source":"official","description":"Generate long, expressive multi-voice speech using Microsoft's powerful TTS","status":"active","release_date":"2025-08-27","model_type":"tts","page_url":"https://fal.run/fal-ai/vibevoice/7b","tagline":"Generate long, expressive 
multi-voice speech using Microsoft's powerful TTS","modalities":{"input":["text"],"output":["audio"]},"endpoints":["audio_speech"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/vibevoice","name":"VibeVoice 1.5B","created_by":"fal","source":"official","description":"Generate long, expressive multi-voice speech using Microsoft's powerful TTS","status":"active","release_date":"2025-08-27","model_type":"tts","page_url":"https://fal.run/fal-ai/vibevoice","tagline":"Generate long, expressive multi-voice speech using Microsoft's powerful TTS","modalities":{"input":["text"],"output":["audio"]},"endpoints":["audio_speech"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/video-as-prompt","name":"Video As Prompt","created_by":"fal","source":"official","description":"A model for unified semantic control in video generation.","status":"active","release_date":"2025-10-29","model_type":"other","page_url":"https://fal.run/fal-ai/video-as-prompt","tagline":"A model for unified semantic control in video generation.","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/video-prompt-generator","name":"Video Prompt Generator","created_by":"fal","source":"official","description":"Generate video prompts using a variety of techniques including camera direction, style, pacing, special effects and more.","status":"active","release_date":"2025-02-25","model_type":"other","page_url":"https://fal.run/fal-ai/video-prompt-generator","tagline":"Generate video prompts using a variety of techniques including camera direction, style, pacing, special effects and more.","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/video-understanding","name":"Video Understanding","created_by":"fal","source":"official","description":"A video understanding model to analyze video content and answer questions about what's happening in the video based on user 
prompts.","status":"active","release_date":"2025-06-20","model_type":"other","page_url":"https://fal.run/fal-ai/video-understanding","tagline":"A video understanding model to analyze video content and answer questions about what's happening in the video based on user prompts.","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/video-upscaler","name":"Video Upscaler","created_by":"fal","source":"official","description":"The video upscaler endpoint uses RealESRGAN on each frame of the input video to upscale the video to a higher resolution.","status":"active","release_date":"2024-12-04","model_type":"other","page_url":"https://fal.run/fal-ai/video-upscaler","tagline":"The video upscaler endpoint uses RealESRGAN on each frame of the input video to upscale the video to a higher resolution.","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/vidu/image-to-video","name":"Vidu Image to Video","created_by":"fal","source":"official","description":"Vidu Image to Video generates high-quality videos with exceptional visual quality and motion diversity from a single image","status":"active","release_date":"2025-03-12","model_type":"video","page_url":"https://fal.run/fal-ai/vidu/image-to-video","tagline":"Vidu Image to Video generates high-quality videos with exceptional visual quality and motion diversity from a single image","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-27","last_updated":"2026-05-11"},{"id":"fal-ai/vidu/q1/image-to-video","name":"Vidu Image to Video","created_by":"fal","source":"official","description":"Vidu Q1 Image to Video generates high-quality 1080p videos with exceptional visual quality and motion diversity from a single image","status":"active","release_date":"2025-05-09","model_type":"video","page_url":"https://fal.run/fal-ai/vidu/q1/image-to-video","tagline":"Vidu Q1 Image to Video generates 
high-quality 1080p videos with exceptional visual quality and motion diversity from a single image","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-27","last_updated":"2026-05-11"},{"id":"fal-ai/vidu/q1/reference-to-video","name":"Vidu","created_by":"fal","source":"official","description":"Generate video clips from your multiple image references using Vidu Q1","status":"active","release_date":"2025-07-08","model_type":"video","page_url":"https://fal.run/fal-ai/vidu/q1/reference-to-video","tagline":"Generate video clips from your multiple image references using Vidu Q1","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-27","last_updated":"2026-05-11"},{"id":"fal-ai/vidu/q1/start-end-to-video","name":"Vidu Start End to Video","created_by":"fal","source":"official","description":"Vidu Q1 Start-End to Video generates smooth transition 1080p videos between specified start and end images.","status":"active","release_date":"2025-05-09","model_type":"video","page_url":"https://fal.run/fal-ai/vidu/q1/start-end-to-video","tagline":"Vidu Q1 Start-End to Video generates smooth transition 1080p videos between specified start and end images.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-27","last_updated":"2026-05-11"},{"id":"fal-ai/vidu/q1/text-to-video","name":"Vidu Text to Video","created_by":"fal","source":"official","description":"Vidu Q1 Text to Video generates high-quality 1080p videos with exceptional visual quality and motion diversity","status":"active","release_date":"2025-05-09","model_type":"video","page_url":"https://fal.run/fal-ai/vidu/q1/text-to-video","tagline":"Vidu Q1 Text to Video generates high-quality 1080p videos with exceptional visual quality and motion 
diversity","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-27","last_updated":"2026-05-11"},{"id":"fal-ai/vidu/q2/image-to-video/pro","name":"Vidu","created_by":"fal","source":"official","description":"Use the latest Vidu Q2 models which much more better quality and control on your videos.","status":"active","release_date":"2025-10-24","model_type":"video","page_url":"https://fal.run/fal-ai/vidu/q2/image-to-video/pro","tagline":"Use the latest Vidu Q2 models which much more better quality and control on your videos.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-27","last_updated":"2026-05-11"},{"id":"fal-ai/vidu/q2/image-to-video/turbo","name":"Vidu","created_by":"fal","source":"official","description":"Use the latest Vidu Q2 models which much more better quality and control on your videos.","status":"active","release_date":"2025-10-24","model_type":"video","page_url":"https://fal.run/fal-ai/vidu/q2/image-to-video/turbo","tagline":"Use the latest Vidu Q2 models which much more better quality and control on your videos.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-27","last_updated":"2026-05-11"},{"id":"fal-ai/vidu/q2/reference-to-image","name":"Vidu","created_by":"fal","source":"official","description":"Vidu Reference-to-Image creates images by using a reference images and combining them with a prompt.","status":"active","release_date":"2025-12-02","model_type":"image","page_url":"https://fal.run/fal-ai/vidu/q2/reference-to-image","tagline":"Vidu Reference-to-Image creates images by using a reference images and combining them with a 
prompt.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-27","last_updated":"2026-05-11"},{"id":"fal-ai/vidu/q2/reference-to-video/pro","name":"Vidu","created_by":"fal","source":"official","description":"Use the latest Vidu Q2 Pro models which much more better quality and control on your videos.","status":"active","release_date":"2026-01-19","model_type":"video","page_url":"https://fal.run/fal-ai/vidu/q2/reference-to-video/pro","tagline":"Use the latest Vidu Q2 Pro models which much more better quality and control on your videos.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-27","last_updated":"2026-05-11"},{"id":"fal-ai/vidu/q2/text-to-image","name":"Vidu","created_by":"fal","source":"official","description":"Use vidu Text-to-Image to turn your prompts into reality.","status":"active","release_date":"2025-12-02","model_type":"image","page_url":"https://fal.run/fal-ai/vidu/q2/text-to-image","tagline":"Use vidu Text-to-Image to turn your prompts into reality.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-27","last_updated":"2026-05-11"},{"id":"fal-ai/vidu/q2/text-to-video","name":"Vidu","created_by":"fal","source":"official","description":"Use the latest Vidu Q2 models which much more better quality and control on your videos.","status":"active","release_date":"2025-10-22","model_type":"video","page_url":"https://fal.run/fal-ai/vidu/q2/text-to-video","tagline":"Use the latest Vidu Q2 models which much more better quality and control on your videos.","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-27","last_updated":"2026-05-11"},{"id":"fal-ai/vidu/q2/video-extension/pro","name":"Vidu","created_by":"fal","source":"official","description":"Use the latest Vidu 
Q2 models which much more better quality and control on your videos.","status":"active","release_date":"2025-10-24","model_type":"other","page_url":"https://fal.run/fal-ai/vidu/q2/video-extension/pro","tagline":"Use the latest Vidu Q2 models which much more better quality and control on your videos.","last_seen_at":"2026-04-27","last_updated":"2026-05-11"},{"id":"fal-ai/vidu/q3/image-to-video/turbo","name":"Vidu","created_by":"fal","source":"official","description":"Vidu's Q3 Turbo Model","status":"active","release_date":"2026-02-06","model_type":"video","page_url":"https://fal.run/fal-ai/vidu/q3/image-to-video/turbo","tagline":"Vidu's Q3 Turbo Model","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/vidu/q3/image-to-video","name":"Vidu","created_by":"fal","source":"official","description":"Vidu's latest Q3 pro models.","status":"active","release_date":"2026-01-31","model_type":"video","page_url":"https://fal.run/fal-ai/vidu/q3/image-to-video","tagline":"Vidu's latest Q3 pro models.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/vidu/q3/reference-to-video/mix","name":"Vidu","created_by":"fal","source":"official","description":"Vidu's latest Q3 Reference to Video Mix model","status":"active","release_date":"2026-04-08","model_type":"video","page_url":"https://fal.run/fal-ai/vidu/q3/reference-to-video/mix","tagline":"Vidu's latest Q3 Reference to Video Mix model","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/vidu/q3/text-to-video/turbo","name":"Vidu","created_by":"fal","source":"official","description":"Vidu's Q3 Turbo 
Model.","status":"active","release_date":"2026-02-06","model_type":"video","page_url":"https://fal.run/fal-ai/vidu/q3/text-to-video/turbo","tagline":"Vidu's Q3 Turbo Model.","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/vidu/q3/text-to-video","name":"Vidu","created_by":"fal","source":"official","description":"Vidu's latest Q3 pro models","status":"active","release_date":"2026-01-31","model_type":"video","page_url":"https://fal.run/fal-ai/vidu/q3/text-to-video","tagline":"Vidu's latest Q3 pro models","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/vidu/reference-to-image","name":"Vidu","created_by":"fal","source":"official","description":"Vidu Reference-to-Image creates images by using a reference images and combining them with a prompt.","status":"active","release_date":"2025-09-09","model_type":"image","page_url":"https://fal.run/fal-ai/vidu/reference-to-image","tagline":"Vidu Reference-to-Image creates images by using a reference images and combining them with a prompt.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-27","last_updated":"2026-05-11"},{"id":"fal-ai/vidu/reference-to-video","name":"Vidu Reference to Video","created_by":"fal","source":"official","description":"Vidu Reference to Video creates videos by using a reference images and combining them with a prompt.","status":"active","release_date":"2025-03-12","model_type":"video","page_url":"https://fal.run/fal-ai/vidu/reference-to-video","tagline":"Vidu Reference to Video creates videos by using a reference images and combining them with a 
prompt.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-27","last_updated":"2026-05-11"},{"id":"fal-ai/vidu/start-end-to-video","name":"Vidu Start-End to Video","created_by":"fal","source":"official","description":"Vidu Start-End to Video generates smooth transition videos between specified start and end images.","status":"active","release_date":"2025-03-12","model_type":"video","page_url":"https://fal.run/fal-ai/vidu/start-end-to-video","tagline":"Vidu Start-End to Video generates smooth transition videos between specified start and end images.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-27","last_updated":"2026-05-11"},{"id":"fal-ai/vidu/template-to-video","name":"Vidu Template to Video","created_by":"fal","source":"official","description":"Vidu Template to Video lets you create different effects by applying motion templates to your images.","status":"active","release_date":"2025-03-12","model_type":"video","page_url":"https://fal.run/fal-ai/vidu/template-to-video","tagline":"Vidu Template to Video lets you create different effects by applying motion templates to your images.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-27","last_updated":"2026-05-11"},{"id":"fal-ai/void-video-inpainting","name":"Void Video Inpainting","created_by":"fal","source":"official","description":"VOID removes objects from videos along with all interactions they induce on the scene","status":"active","release_date":"2026-04-10","model_type":"other","page_url":"https://fal.run/fal-ai/void-video-inpainting","tagline":"VOID removes objects from videos along with all interactions they induce on the scene","last_seen_at":"2026-04-28","last_updated":"2026-05-11"},{"id":"fal-ai/wan-22-image-trainer","name":"Wan 2.2 14B Image 
Trainer","created_by":"fal","source":"official","family":"wan","description":"Wan 2.2 text to image LoRA trainer.","status":"active","release_date":"2025-08-11","model_type":"other","page_url":"https://fal.run/fal-ai/wan-22-image-trainer","tagline":"Wan 2.2 text to image LoRA trainer.","capabilities":{"vision":true},"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/wan-22-trainer/i2v-a14b","name":"Wan-2.2 LoRA Trainer","created_by":"fal","source":"official","family":"wan","description":"Train custom LoRAs for Wan-2.2 T2V/I2V 480P","status":"active","release_date":"2026-02-23","model_type":"other","page_url":"https://fal.run/fal-ai/wan-22-trainer/i2v-a14b","tagline":"Train custom LoRAs for Wan-2.2 T2V/I2V 480P","last_seen_at":"2026-02-25","last_updated":"2026-05-11"},{"id":"fal-ai/wan-22-trainer/t2v-a14b","name":"Wan-2.2 LoRA Trainer","created_by":"fal","source":"official","family":"wan","description":"Train custom LoRAs for Wan-2.2 T2V/I2V 480P","status":"active","release_date":"2026-02-23","model_type":"other","page_url":"https://fal.run/fal-ai/wan-22-trainer/t2v-a14b","tagline":"Train custom LoRAs for Wan-2.2 T2V/I2V 480P","last_seen_at":"2026-02-25","last_updated":"2026-05-11"},{"id":"fal-ai/wan-22-vace-fun-a14b/depth","name":"Wan 2.2 VACE Fun A14B","created_by":"fal","source":"official","family":"wan","description":"VACE Fun for Wan 2.2 A14B from Alibaba-PAI","status":"active","release_date":"2025-09-17","model_type":"other","page_url":"https://fal.run/fal-ai/wan-22-vace-fun-a14b/depth","tagline":"VACE Fun for Wan 2.2 A14B from Alibaba-PAI","last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/wan-22-vace-fun-a14b/inpainting","name":"Wan 2.2 VACE Fun A14B","created_by":"fal","source":"official","family":"wan","description":"VACE Fun for Wan 2.2 A14B from Alibaba-PAI","status":"active","release_date":"2025-09-17","model_type":"other","page_url":"https://fal.run/fal-ai/wan-22-vace-fun-a14b/inpainting","tagline":"VACE Fun for 
Wan 2.2 A14B from Alibaba-PAI","last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/wan-22-vace-fun-a14b/outpainting","name":"Wan 2.2 VACE Fun A14B","created_by":"fal","source":"official","family":"wan","description":"VACE Fun for Wan 2.2 A14B from Alibaba-PAI","status":"active","release_date":"2025-09-17","model_type":"other","page_url":"https://fal.run/fal-ai/wan-22-vace-fun-a14b/outpainting","tagline":"VACE Fun for Wan 2.2 A14B from Alibaba-PAI","last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/wan-22-vace-fun-a14b/reframe","name":"Wan 2.2 VACE Fun A14B","created_by":"fal","source":"official","family":"wan","description":"VACE Fun for Wan 2.2 A14B from Alibaba-PAI","status":"active","release_date":"2025-09-17","model_type":"other","page_url":"https://fal.run/fal-ai/wan-22-vace-fun-a14b/reframe","tagline":"VACE Fun for Wan 2.2 A14B from Alibaba-PAI","last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/wan-25-preview/image-to-image","name":"Wan 2.5 Image to Image","created_by":"fal","source":"official","family":"wan","description":"Wan 2.5 image-to-image model.","status":"active","release_date":"2025-09-25","model_type":"image","page_url":"https://fal.run/fal-ai/wan-25-preview/image-to-image","tagline":"Wan 2.5 image-to-image model.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/wan-25-preview/image-to-video","name":"Wan 2.5 Image to Video","created_by":"fal","source":"official","family":"wan","description":"Wan 2.5 image-to-video model.","status":"active","release_date":"2025-09-24","model_type":"video","page_url":"https://fal.run/fal-ai/wan-25-preview/image-to-video","tagline":"Wan 2.5 image-to-video 
model.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/wan-25-preview/text-to-image","name":"Wan 2.5 Text to Image","created_by":"fal","source":"official","family":"wan","description":"Wan 2.5 text-to-image model.","status":"active","release_date":"2025-09-25","model_type":"image","page_url":"https://fal.run/fal-ai/wan-25-preview/text-to-image","tagline":"Wan 2.5 text-to-image model.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/wan-25-preview/text-to-video","name":"Wan 2.5 Text to Video","created_by":"fal","source":"official","family":"wan","description":"Wan 2.5 text-to-video model.","status":"active","release_date":"2025-09-24","model_type":"video","page_url":"https://fal.run/fal-ai/wan-25-preview/text-to-video","tagline":"Wan 2.5 text-to-video model.","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-27","last_updated":"2026-05-11"},{"id":"fal-ai/wan-alpha","name":"Wan Alpha","created_by":"fal","source":"official","family":"wan","description":"Generate videos with transparent backgrounds","status":"active","release_date":"2025-10-16","model_type":"video","page_url":"https://fal.run/fal-ai/wan-alpha","tagline":"Generate videos with transparent backgrounds","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/wan-ati","name":"Wan Ati","created_by":"fal","source":"official","family":"wan","description":"WAN-ATI is a controllable video generation model that uses trajectory instructions to guide object, local, and camera motion, enabling precise and flexible image-to-video 
creation.","status":"active","release_date":"2025-08-29","model_type":"video","page_url":"https://fal.run/fal-ai/wan-ati","tagline":"WAN-ATI is a controllable video generation model that uses trajectory instructions to guide object, local, and camera motion, enabling precise and flexible image-to-video creation.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/wan-effects","name":"Wan Effects","created_by":"fal","source":"official","family":"wan","description":"Wan Effects generates high-quality videos with popular effects from images","status":"active","release_date":"2025-03-13","model_type":"video","page_url":"https://fal.run/fal-ai/wan-effects","tagline":"Wan Effects generates high-quality videos with popular effects from images","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/wan-flf2v","name":"Wan-2.1 First-Last-Frame-to-Video","created_by":"fal","source":"official","family":"wan","description":"Wan-2.1 flf2v generates dynamic videos by intelligently bridging a given first frame to a desired end frame through smooth, coherent motion sequences.","status":"active","release_date":"2025-04-17","model_type":"video","page_url":"https://fal.run/fal-ai/wan-flf2v","tagline":"Wan-2.1 flf2v generates dynamic videos by intelligently bridging a given first frame to a desired end frame through smooth, coherent motion sequences.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/wan-fun-control","name":"Wan 2.2 Fun Control","created_by":"fal","source":"official","family":"wan","description":"Generate pose or depth controlled video using Alibaba-PAI's Wan 2.2 
Fun","status":"active","release_date":"2025-08-28","model_type":"other","page_url":"https://fal.run/fal-ai/wan-fun-control","tagline":"Generate pose or depth controlled video using Alibaba-PAI's Wan 2.2 Fun","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/wan-i2v-lora","name":"Wan-2.1 Image-to-Video with LoRAs","created_by":"fal","source":"official","family":"wan","description":"Add custom LoRAs to Wan-2.1 is a image-to-video model that generates high-quality videos with high visual quality and motion diversity from images","status":"active","release_date":"2025-03-08","model_type":"video","page_url":"https://fal.run/fal-ai/wan-i2v-lora","tagline":"Add custom LoRAs to Wan-2.1 is a image-to-video model that generates high-quality videos with high visual quality and motion diversity from images","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/wan-i2v","name":"Wan-2.1 Image-to-Video","created_by":"fal","source":"official","family":"wan","description":"Wan-2.1 is a image-to-video model that generates high-quality videos with high visual quality and motion diversity from images","status":"active","release_date":"2025-02-25","model_type":"video","page_url":"https://fal.run/fal-ai/wan-i2v","tagline":"Wan-2.1 is a image-to-video model that generates high-quality videos with high visual quality and motion diversity from images","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/wan-motion","name":"Wan Motion","created_by":"fal","source":"official","family":"wan","description":"Wan Motion is a streamlined character animation model that transfers motion from a driving video onto a reference character 
image.","status":"active","release_date":"2026-02-19","model_type":"other","page_url":"https://fal.run/fal-ai/wan-motion","tagline":"Wan Motion is a streamlined character animation model that transfers motion from a driving video onto a reference character image.","capabilities":{"vision":true},"last_seen_at":"2026-02-23","last_updated":"2026-05-11"},{"id":"fal-ai/wan-move","name":"Wan Move [480p]","created_by":"fal","source":"official","family":"wan","description":"Use Wan-Move to generate videos with controlled the motion using trajectories","status":"active","release_date":"2025-12-24","model_type":"video","page_url":"https://fal.run/fal-ai/wan-move","tagline":"Use Wan-Move to generate videos with controlled the motion using trajectories","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/wan-pro/image-to-video","name":"Wan-2.1 Pro Image-to-Video","created_by":"fal","source":"official","family":"wan","description":"Wan-2.1 Pro is a premium image-to-video model that generates high-quality 1080p videos at 30fps with up to 6 seconds duration, delivering exceptional visual quality and motion diversity from images","status":"active","release_date":"2025-03-11","model_type":"video","page_url":"https://fal.run/fal-ai/wan-pro/image-to-video","tagline":"Wan-2.1 Pro is a premium image-to-video model that generates high-quality 1080p videos at 30fps with up to 6 seconds duration, delivering exceptional visual quality and motion diversity from images","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/wan-pro/text-to-video","name":"Wan-2.1 Pro Text-to-Video","created_by":"fal","source":"official","family":"wan","description":"Wan-2.1 Pro is a premium text-to-video model that generates high-quality 1080p videos at 
30fps with up to 6 seconds duration, delivering exceptional visual quality and motion diversity from text promp","status":"active","release_date":"2025-03-11","model_type":"video","page_url":"https://fal.run/fal-ai/wan-pro/text-to-video","tagline":"Wan-2.1 Pro is a premium text-to-video model that generates high-quality 1080p videos at 30fps with up to 6 seconds duration, delivering exceptional visual quality and motion diversity from text promp","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/wan-t2v-lora","name":"Wan-2.1 Text-to-Video with LoRAs","created_by":"fal","source":"official","family":"wan","description":"Add custom LoRAs to Wan-2.1 is a text-to-video model that generates high-quality videos with high visual quality and motion diversity from images","status":"active","release_date":"2025-03-25","model_type":"video","page_url":"https://fal.run/fal-ai/wan-t2v-lora","tagline":"Add custom LoRAs to Wan-2.1 is a text-to-video model that generates high-quality videos with high visual quality and motion diversity from images","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/wan-t2v","name":"Wan-2.1 Text-to-Video","created_by":"fal","source":"official","family":"wan","description":"Wan-2.1 is a text-to-video model that generates high-quality videos with high visual quality and motion diversity from text prompts","status":"active","release_date":"2025-02-25","model_type":"video","page_url":"https://fal.run/fal-ai/wan-t2v","tagline":"Wan-2.1 is a text-to-video model that generates high-quality videos with high visual quality and motion diversity from text prompts","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/wan-trainer/flf2v-720p","name":"Wan-2.1 
LoRA Trainer","created_by":"fal","source":"official","family":"wan","description":"Train custom LoRAs for Wan-2.1 FLF2V 720P","status":"active","release_date":"2025-06-11","model_type":"other","page_url":"https://fal.run/fal-ai/wan-trainer/flf2v-720p","tagline":"Train custom LoRAs for Wan-2.1 FLF2V 720P","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/wan-trainer/i2v-720p","name":"Wan-2.1 LoRA Trainer","created_by":"fal","source":"official","family":"wan","description":"Train custom LoRAs for Wan-2.1 I2V 720P","status":"active","release_date":"2025-06-11","model_type":"other","page_url":"https://fal.run/fal-ai/wan-trainer/i2v-720p","tagline":"Train custom LoRAs for Wan-2.1 I2V 720P","last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/wan-trainer/t2v-14b","name":"Wan-2.1 LoRA Trainer","created_by":"fal","source":"official","family":"wan","description":"Train custom LoRAs for Wan-2.1 T2V 14B","status":"active","release_date":"2025-06-11","model_type":"other","parameters":14,"page_url":"https://fal.run/fal-ai/wan-trainer/t2v-14b","tagline":"Train custom LoRAs for Wan-2.1 T2V 14B","last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/wan-trainer/t2v","name":"Wan-2.1 LoRA Trainer","created_by":"fal","source":"official","family":"wan","description":"Train custom LoRAs for Wan-2.1 T2V 1.3B","status":"active","release_date":"2025-06-11","model_type":"other","page_url":"https://fal.run/fal-ai/wan-trainer/t2v","tagline":"Train custom LoRAs for Wan-2.1 T2V 1.3B","last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/wan-trainer","name":"Wan-2.1 LoRA Trainer","created_by":"fal","source":"official","family":"wan","description":"Train custom LoRAs for Wan-2.1 I2V 480P","status":"active","release_date":"2025-03-24","model_type":"other","page_url":"https://fal.run/fal-ai/wan-trainer","tagline":"Train custom LoRAs for Wan-2.1 I2V 
480P","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/wan/v2.1/1.3b/text-to-video","name":"Wan-2.1 1.3B Text-to-Video","created_by":"fal","source":"official","family":"wan","description":"Wan-2.1 1.3B is a text-to-video model that generates high-quality videos with high visual quality and motion diversity from text promptsat faster speeds.","status":"active","release_date":"2025-02-27","model_type":"video","page_url":"https://fal.run/fal-ai/wan/v2.1/1.3b/text-to-video","tagline":"Wan-2.1 1.3B is a text-to-video model that generates high-quality videos with high visual quality and motion diversity from text promptsat faster speeds.","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/wan/v2.2-14b/animate/move","name":"Wan-2.2 Animate Move","created_by":"fal","source":"official","family":"wan","description":"Wan-Animate is a video model that generates high-fidelity character videos by replicating the expressions and movements of characters from reference videos.","status":"active","release_date":"2025-09-21","model_type":"other","page_url":"https://fal.run/fal-ai/wan/v2.2-14b/animate/move","tagline":"Wan-Animate is a video model that generates high-fidelity character videos by replicating the expressions and movements of characters from reference videos.","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/wan/v2.2-14b/animate/replace","name":"Wan-2.2 Animate Replace","created_by":"fal","source":"official","family":"wan","description":"Wan-Animate Replace is a model that can integrate animated characters into reference videos, replacing the original character while preserving the scene’s lighting and color tone for seamless environm","status":"active","release_date":"2025-09-21","model_type":"other","page_url":"https://fal.run/fal-ai/wan/v2.2-14b/animate/replace","tagline":"Wan-Animate Replace is a model that can integrate animated 
characters into reference videos, replacing the original character while preserving the scene’s lighting and color tone for seamless environm","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/wan/v2.2-14b/speech-to-video","name":"Wan-2.2 Speech-to-Video 14B","created_by":"fal","source":"official","family":"wan","description":"Wan-S2V is a video model that generates high-quality videos from static images and audio, with realistic facial expressions, body movements, and professional camera work for film and television applic","status":"active","release_date":"2025-08-27","model_type":"other","page_url":"https://fal.run/fal-ai/wan/v2.2-14b/speech-to-video","tagline":"Wan-S2V is a video model that generates high-quality videos from static images and audio, with realistic facial expressions, body movements, and professional camera work for film and television applic","capabilities":{"vision":true},"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/wan/v2.2-5b/image-to-video","name":"Wan v2.2 5B","created_by":"fal","source":"official","family":"wan","description":"Wan 2.2's 5B model produces up to 5 seconds of video 720p at 24FPS with fluid motion and powerful prompt understanding","status":"active","release_date":"2025-07-30","model_type":"video","page_url":"https://fal.run/fal-ai/wan/v2.2-5b/image-to-video","tagline":"Wan 2.2's 5B model produces up to 5 seconds of video 720p at 24FPS with fluid motion and powerful prompt understanding","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/wan/v2.2-5b/text-to-image","name":"Wan","created_by":"fal","source":"official","family":"wan","description":"Wan 2.2's 5B model generates high-resolution, photorealistic images with powerful prompt understanding and fine-grained visual 
detail","status":"active","release_date":"2025-08-05","model_type":"image","page_url":"https://fal.run/fal-ai/wan/v2.2-5b/text-to-image","tagline":"Wan 2.2's 5B model generates high-resolution, photorealistic images with powerful prompt understanding and fine-grained visual detail","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/wan/v2.2-5b/text-to-video/distill","name":"Wan","created_by":"fal","source":"official","family":"wan","description":"Wan 2.2's 5B distill model produces up to 5 seconds of video 720p at 24FPS with fluid motion and powerful prompt understanding","status":"active","release_date":"2025-08-06","model_type":"video","page_url":"https://fal.run/fal-ai/wan/v2.2-5b/text-to-video/distill","tagline":"Wan 2.2's 5B distill model produces up to 5 seconds of video 720p at 24FPS with fluid motion and powerful prompt understanding","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/wan/v2.2-5b/text-to-video/fast-wan","name":"Wan","created_by":"fal","source":"official","family":"wan","description":"Wan 2.2's 5B FastVideo model produces up to 5 seconds of video 720p at 24FPS with fluid motion and powerful prompt understanding","status":"active","release_date":"2025-08-05","model_type":"video","page_url":"https://fal.run/fal-ai/wan/v2.2-5b/text-to-video/fast-wan","tagline":"Wan 2.2's 5B FastVideo model produces up to 5 seconds of video 720p at 24FPS with fluid motion and powerful prompt understanding","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/wan/v2.2-5b/text-to-video","name":"Wan v2.2 5B","created_by":"fal","source":"official","family":"wan","description":"Wan 2.2's 5B model produces up to 5 seconds of video 720p at 24FPS with fluid motion 
and powerful prompt understanding","status":"active","release_date":"2025-07-28","model_type":"video","page_url":"https://fal.run/fal-ai/wan/v2.2-5b/text-to-video","tagline":"Wan 2.2's 5B model produces up to 5 seconds of video 720p at 24FPS with fluid motion and powerful prompt understanding","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/wan/v2.2-a14b/image-to-image","name":"Wan","created_by":"fal","source":"official","family":"wan","description":"Wan 2.2's 14B model edit high-resolution, photorealistic images with powerful prompt understanding and fine-grained visual detail","status":"active","release_date":"2025-09-03","model_type":"image","page_url":"https://fal.run/fal-ai/wan/v2.2-a14b/image-to-image","tagline":"Wan 2.2's 14B model edit high-resolution, photorealistic images with powerful prompt understanding and fine-grained visual detail","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/wan/v2.2-a14b/image-to-video/lora","name":"Wan v2.2 A14B Image-to-Video A14B with LoRAs","created_by":"fal","source":"official","family":"wan","description":"Wan-2.2 image-to-video is a video model that generates high-quality videos with high visual quality and motion diversity from text prompts and images.","status":"active","release_date":"2025-08-07","model_type":"video","page_url":"https://fal.run/fal-ai/wan/v2.2-a14b/image-to-video/lora","tagline":"Wan-2.2 image-to-video is a video model that generates high-quality videos with high visual quality and motion diversity from text prompts and 
images.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/wan/v2.2-a14b/image-to-video/turbo","name":"Wan","created_by":"fal","source":"official","family":"wan","description":"Wan-2.2 Turbo image-to-video is a video model that generates high-quality videos with high visual quality and motion diversity from text prompts.","status":"active","release_date":"2025-07-31","model_type":"video","page_url":"https://fal.run/fal-ai/wan/v2.2-a14b/image-to-video/turbo","tagline":"Wan-2.2 Turbo image-to-video is a video model that generates high-quality videos with high visual quality and motion diversity from text prompts.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/wan/v2.2-a14b/image-to-video","name":"Wan v2.2 A14B","created_by":"fal","source":"official","family":"wan","description":"fal-ai/wan/v2.2-A14B/image-to-video","status":"active","release_date":"2025-07-28","model_type":"video","page_url":"https://fal.run/fal-ai/wan/v2.2-a14B/image-to-video","tagline":"fal-ai/wan/v2.2-A14B/image-to-video","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/wan/v2.2-a14b/text-to-image/lora","name":"Wan v2.2 A14B Text-to-Image A14B with LoRAs","created_by":"fal","source":"official","family":"wan","description":"Wan 2.2's 14B model with LoRA support generates high-fidelity images with enhanced prompt alignment, style adaptability.","status":"active","release_date":"2025-08-05","model_type":"image","page_url":"https://fal.run/fal-ai/wan/v2.2-a14b/text-to-image/lora","tagline":"Wan 2.2's 14B model with LoRA support generates high-fidelity images with enhanced prompt alignment, style 
adaptability.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/wan/v2.2-a14b/text-to-image","name":"Wan","created_by":"fal","source":"official","family":"wan","description":"Wan 2.2's 14B model generates high-resolution, photorealistic images with powerful prompt understanding and fine-grained visual detail","status":"active","release_date":"2025-08-05","model_type":"image","page_url":"https://fal.run/fal-ai/wan/v2.2-a14b/text-to-image","tagline":"Wan 2.2's 14B model generates high-resolution, photorealistic images with powerful prompt understanding and fine-grained visual detail","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/wan/v2.2-a14b/text-to-video/lora","name":"Wan-2.2 Text-to-Video A14B with LoRAs","created_by":"fal","source":"official","family":"wan","description":"Wan-2.2 text-to-video is a video model that generates high-quality videos with high visual quality and motion diversity from text prompts.","status":"active","release_date":"2025-08-07","model_type":"video","page_url":"https://fal.run/fal-ai/wan/v2.2-a14b/text-to-video/lora","tagline":"Wan-2.2 text-to-video is a video model that generates high-quality videos with high visual quality and motion diversity from text prompts.","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"fal-ai/wan/v2.2-a14b/text-to-video/turbo","name":"Wan","created_by":"fal","source":"official","family":"wan","description":"Wan-2.2 turbo text-to-video is a video model that generates high-quality videos with high visual quality and motion diversity from text 
prompts.","status":"active","release_date":"2025-07-31","model_type":"video","page_url":"https://fal.run/fal-ai/wan/v2.2-a14b/text-to-video/turbo","tagline":"Wan-2.2 turbo text-to-video is a video model that generates high-quality videos with high visual quality and motion diversity from text prompts.","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/wan/v2.2-a14b/text-to-video","name":"Wan-2.2 Text-to-Video A14B","created_by":"fal","source":"official","family":"wan","description":"Wan-2.2 text-to-video is a video model that generates high-quality videos with high visual quality and motion diversity from text prompts.","status":"active","release_date":"2025-07-28","model_type":"video","page_url":"https://fal.run/fal-ai/wan/v2.2-a14b/text-to-video","tagline":"Wan-2.2 text-to-video is a video model that generates high-quality videos with high visual quality and motion diversity from text prompts.","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/wan/v2.2-a14b/video-to-video","name":"Wan","created_by":"fal","source":"official","family":"wan","description":"Wan-2.2 video-to-video is a video model that generates high-quality videos with high visual quality and motion diversity from text prompts and source videos.","status":"active","release_date":"2025-08-02","model_type":"other","page_url":"https://fal.run/fal-ai/wan/v2.2-a14b/video-to-video","tagline":"Wan-2.2 video-to-video is a video model that generates high-quality videos with high visual quality and motion diversity from text prompts and source videos.","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/wan/v2.7/edit-video","name":"Wan","created_by":"fal","source":"official","family":"wan","description":"Wan 2.7 is the latest generation AI video model, delivering enhanced motion smoothness, superior scene 
fidelity, and greater visual coherence.","status":"active","release_date":"2026-03-28","model_type":"other","page_url":"https://fal.run/fal-ai/wan/v2.7/edit-video","tagline":"Wan 2.7 is the latest generation AI video model, delivering enhanced motion smoothness, superior scene fidelity, and greater visual coherence.","last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/wan/v2.7/edit","name":"Wan","created_by":"fal","source":"official","family":"wan","description":"Transform and edit existing images with text-guided instructions using the WAN 2.7 model for creative image manipulation.","status":"active","release_date":"2026-04-01","model_type":"image","page_url":"https://fal.run/fal-ai/wan/v2.7/edit","tagline":"Transform and edit existing images with text-guided instructions using the WAN 2.7 model for creative image manipulation.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/wan/v2.7/image-to-video","name":"Wan","created_by":"fal","source":"official","family":"wan","description":"Wan 2.7 is the latest generation AI video model, delivering enhanced motion smoothness, superior scene fidelity, and greater visual coherence.","status":"active","release_date":"2026-03-28","model_type":"video","page_url":"https://fal.run/fal-ai/wan/v2.7/image-to-video","tagline":"Wan 2.7 is the latest generation AI video model, delivering enhanced motion smoothness, superior scene fidelity, and greater visual coherence.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/wan/v2.7/pro/edit","name":"Wan","created_by":"fal","source":"official","family":"wan","description":"Edit and transform images using text instructions with the WAN 2.7 Pro model for precise, professional-grade image 
modifications.","status":"active","release_date":"2026-04-01","model_type":"image","page_url":"https://fal.run/fal-ai/wan/v2.7/pro/edit","tagline":"Edit and transform images using text instructions with the WAN 2.7 Pro model for precise, professional-grade image modifications.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/wan/v2.7/pro/text-to-image","name":"Wan","created_by":"fal","source":"official","family":"wan","description":"Generate premium-quality images from text prompts using the enhanced WAN 2.7 Pro model with superior detail and composition.","status":"active","release_date":"2026-04-01","model_type":"image","page_url":"https://fal.run/fal-ai/wan/v2.7/pro/text-to-image","tagline":"Generate premium-quality images from text prompts using the enhanced WAN 2.7 Pro model with superior detail and composition.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-20","last_updated":"2026-05-11"},{"id":"fal-ai/wan/v2.7/reference-to-video","name":"Wan 2.7 Reference to Video","created_by":"fal","source":"official","family":"wan","description":"Wan 2.7 is the latest generation AI video model, delivering enhanced motion smoothness, superior scene fidelity, and greater visual coherence.","status":"active","release_date":"2026-03-28","model_type":"video","page_url":"https://fal.run/fal-ai/wan/v2.7/reference-to-video","tagline":"Wan 2.7 is the latest generation AI video model, delivering enhanced motion smoothness, superior scene fidelity, and greater visual 
coherence.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/wan/v2.7/text-to-image","name":"Wan","created_by":"fal","source":"official","family":"wan","description":"Generate high-quality images from text prompts using the WAN 2.7 model with advanced prompt understanding and detailed output.","status":"active","release_date":"2026-04-01","model_type":"image","page_url":"https://fal.run/fal-ai/wan/v2.7/text-to-image","tagline":"Generate high-quality images from text prompts using the WAN 2.7 model with advanced prompt understanding and detailed output.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-20","last_updated":"2026-05-11"},{"id":"fal-ai/wan/v2.7/text-to-video","name":"Wan Text to Video","created_by":"fal","source":"official","family":"wan","description":"Wan 2.7 is the latest generation AI video model, delivering enhanced motion smoothness, superior scene fidelity, and greater visual coherence.","status":"active","release_date":"2026-03-28","model_type":"video","page_url":"https://fal.run/fal-ai/wan/v2.7/text-to-video","tagline":"Wan 2.7 is the latest generation AI video model, delivering enhanced motion smoothness, superior scene fidelity, and greater visual coherence.","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/wan-vace-1-3b","name":"Wan Vace 1 3b","created_by":"fal","source":"official","family":"wan","description":"Vace a video generation model that uses a source image, mask, and video to create prompted videos with controllable sources.","status":"active","release_date":"2025-06-04","model_type":"other","parameters":3,"page_url":"https://fal.run/fal-ai/wan-vace-1-3b","tagline":"Vace a video generation model that uses a source image, mask, 
and video to create prompted videos with controllable sources.","capabilities":{"vision":true},"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/wan-vace-14b/depth","name":"Wan VACE 14B","created_by":"fal","source":"official","family":"wan","description":"VACE is a video generation model that uses a source image, mask, and video to create prompted videos with controllable sources.","status":"active","release_date":"2025-06-18","model_type":"other","page_url":"https://fal.run/fal-ai/wan-vace-14b/depth","tagline":"VACE is a video generation model that uses a source image, mask, and video to create prompted videos with controllable sources.","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/wan-vace-14b/inpainting","name":"Wan VACE 14B","created_by":"fal","source":"official","family":"wan","description":"VACE is a video generation model that uses a source image, mask, and video to create prompted videos with controllable sources.","status":"active","release_date":"2025-06-18","model_type":"other","page_url":"https://fal.run/fal-ai/wan-vace-14b/inpainting","tagline":"VACE is a video generation model that uses a source image, mask, and video to create prompted videos with controllable sources.","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/wan-vace-14b/outpainting","name":"Wan VACE 14B","created_by":"fal","source":"official","family":"wan","description":"VACE is a video generation model that uses a source image, mask, and video to create prompted videos with controllable sources.","status":"active","release_date":"2025-06-18","model_type":"other","page_url":"https://fal.run/fal-ai/wan-vace-14b/outpainting","tagline":"VACE is a video generation model that uses a source image, mask, and video to create prompted videos with controllable 
sources.","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/wan-vace-14b/pose","name":"Wan VACE 14B","created_by":"fal","source":"official","family":"wan","description":"VACE is a video generation model that uses a source image, mask, and video to create prompted videos with controllable sources.","status":"active","release_date":"2025-06-18","model_type":"other","page_url":"https://fal.run/fal-ai/wan-vace-14b/pose","tagline":"VACE is a video generation model that uses a source image, mask, and video to create prompted videos with controllable sources.","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/wan-vace-14b/reframe","name":"Wan VACE 14B","created_by":"fal","source":"official","family":"wan","description":"VACE is a video generation model that uses a source image, mask, and video to create prompted videos with controllable sources.","status":"active","release_date":"2025-06-18","model_type":"other","page_url":"https://fal.run/fal-ai/wan-vace-14b/reframe","tagline":"VACE is a video generation model that uses a source image, mask, and video to create prompted videos with controllable sources.","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/wan-vace-14b","name":"Wan VACE 14B","created_by":"fal","source":"official","family":"wan","description":"VACE is a video generation model that uses a source image, mask, and video to create prompted videos with controllable sources.","status":"active","release_date":"2025-05-27","model_type":"other","parameters":14,"page_url":"https://fal.run/fal-ai/wan-vace-14b","tagline":"VACE is a video generation model that uses a source image, mask, and video to create prompted videos with controllable sources.","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/wan-vace-apps/long-reframe","name":"Wan 2.1 VACE Long 
Reframe","created_by":"fal","source":"official","family":"wan","description":"Reframe entire videos scene-by-scene using Wan VACE 2.1","status":"active","release_date":"2025-10-07","model_type":"other","page_url":"https://fal.run/fal-ai/wan-vace-apps/long-reframe","tagline":"Reframe entire videos scene-by-scene using Wan VACE 2.1","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/wan-vace-apps/video-edit","name":"Wan VACE Video Edit","created_by":"fal","source":"official","family":"wan","description":"Edit videos using plain language and Wan VACE","status":"active","release_date":"2025-09-22","model_type":"other","page_url":"https://fal.run/fal-ai/wan-vace-apps/video-edit","tagline":"Edit videos using plain language and Wan VACE","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/wan-vace","name":"Vace","created_by":"fal","source":"official","family":"wan","description":"Vace a video generation model that uses a source image, mask, and video to create prompted videos with controllable sources.","status":"active","release_date":"2025-04-11","model_type":"other","page_url":"https://fal.run/fal-ai/wan-vace","tagline":"Vace a video generation model that uses a source image, mask, and video to create prompted videos with controllable sources.","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/wan-vision-enhancer","name":"Wan Vision Enhancer","created_by":"fal","source":"official","family":"wan","description":"Wan Vision Enhancer for magnify/enhance video with high fidelity and creativity.","status":"active","release_date":"2025-12-10","model_type":"other","page_url":"https://fal.run/fal-ai/wan-vision-enhancer","tagline":"Wan Vision Enhancer for magnify/enhance video with high fidelity and creativity.","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/wizper","name":"Wizper (Whisper v3 -- fal.ai 
edition)","created_by":"fal","source":"official","description":"[Experimental] Whisper v3 Large -- but optimized by our inference wizards.","status":"active","release_date":"2024-04-08","model_type":"transcription","page_url":"https://fal.run/fal-ai/wizper","tagline":"[Experimental] Whisper v3 Large -- but optimized by our inference wizards.","modalities":{"input":["audio"],"output":["text"]},"endpoints":["audio_transcriptions"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/workflow-utilities/audio-compressor","name":"Workflow Utilities Audio Compressor","created_by":"fal","source":"official","description":"FFMPEG Utility for Audio Compression","status":"active","release_date":"2026-02-05","model_type":"other","page_url":"https://fal.run/fal-ai/workflow-utilities/audio-compressor","tagline":"FFMPEG Utility for Audio Compression","last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/workflow-utilities/auto-subtitle","name":"Workflow Utilities Auto Subtitle","created_by":"fal","source":"official","description":"Add automatic subtitles to videos","status":"active","release_date":"2025-11-04","model_type":"other","page_url":"https://fal.run/fal-ai/workflow-utilities/auto-subtitle","tagline":"Add automatic subtitles to videos","last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/workflow-utilities/blend-video","name":"Workflow Utilities Blend Video","created_by":"fal","source":"official","description":"FFMPEG Utility for Blending Videos","status":"active","release_date":"2026-02-05","model_type":"other","page_url":"https://fal.run/fal-ai/workflow-utilities/blend-video","tagline":"FFMPEG Utility for Blending Videos","last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/workflow-utilities/extract-nth-frame","name":"Workflow Utilities Extract Nth Frame","created_by":"fal","source":"official","description":"FFMPEG Untility for Extracting nth 
Frame","status":"active","release_date":"2026-02-05","model_type":"image","page_url":"https://fal.run/fal-ai/workflow-utilities/extract-nth-frame","tagline":"FFMPEG Untility for Extracting nth Frame","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/workflow-utilities/impulse-response","name":"Workflow Utilities Impulse Response","created_by":"fal","source":"official","description":"FFMPEG Utility for Impulse Response","status":"active","release_date":"2026-02-05","model_type":"other","page_url":"https://fal.run/fal-ai/workflow-utilities/impulse-response","tagline":"FFMPEG Utility for Impulse Response","last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/workflow-utilities/interleave-video","name":"Workflow Utilities Interleave Video","created_by":"fal","source":"official","description":"ffmpeg utility to interleave videos","status":"active","release_date":"2026-01-27","model_type":"other","page_url":"https://fal.run/fal-ai/workflow-utilities/interleave-video","tagline":"ffmpeg utility to interleave videos","last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/workflow-utilities/pick-image-by-index","name":"Workflow Utilities Pick Image By Index","created_by":"fal","source":"official","description":"Choose the Nth image from an image URL list for workflows.","status":"active","release_date":"2026-04-29","model_type":"other","page_url":"https://fal.run/fal-ai/workflow-utilities/pick-image-by-index","tagline":"Choose the Nth image from an image URL list for workflows.","capabilities":{"vision":true},"last_seen_at":"2026-04-30","last_updated":"2026-06-03"},{"id":"fal-ai/workflow-utilities/reverse-video","name":"Workflow Utilities Reverse Video","created_by":"fal","source":"official","description":"FFMPEG Utility to Reverse 
Videos","status":"active","release_date":"2026-02-19","model_type":"other","page_url":"https://fal.run/fal-ai/workflow-utilities/reverse-video","tagline":"FFMPEG Utility to Reverse Videos","last_seen_at":"2026-02-19","last_updated":"2026-06-03"},{"id":"fal-ai/workflow-utilities/scale-video","name":"Workflow Utilities Scale Video","created_by":"fal","source":"official","description":"FFMPEG Utilities to Scale Videos","status":"active","release_date":"2026-02-16","model_type":"other","page_url":"https://fal.run/fal-ai/workflow-utilities/scale-video","tagline":"FFMPEG Utilities to Scale Videos","last_seen_at":"2026-02-17","last_updated":"2026-06-03"},{"id":"fal-ai/workflow-utilities/trim-video","name":"Workflow Utilities Trim Video","created_by":"fal","source":"official","description":"FFMPEG Utility for Trim Video","status":"active","release_date":"2026-02-11","model_type":"other","page_url":"https://fal.run/fal-ai/workflow-utilities/trim-video","tagline":"FFMPEG Utility for Trim Video","last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/x-ailab/nsfw","name":"NSFW Checker","created_by":"fal","source":"official","description":"Predict whether an image is NSFW or SFW.","status":"active","release_date":"2025-07-28","model_type":"other","page_url":"https://fal.run/fal-ai/x-ailab/nsfw","tagline":"Predict whether an image is NSFW or SFW.","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/yue","name":"YuE: Lyrics to Song","created_by":"fal","source":"official","description":"YuE is a groundbreaking series of open-source foundation models designed for music generation, specifically for transforming lyrics into full songs.","status":"active","release_date":"2025-01-28","model_type":"other","page_url":"https://fal.run/fal-ai/yue","tagline":"YuE is a groundbreaking series of open-source foundation models designed for music generation, specifically for transforming lyrics into full 
songs.","last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/z-image/base/lora","name":"Z Image Base Lora","created_by":"fal","source":"official","description":"LoRA endpoint for Z-Image, the foundation model of the Z- Image family.","status":"active","release_date":"2026-01-27","model_type":"image","page_url":"https://fal.run/fal-ai/z-image/base/lora","tagline":"LoRA endpoint for Z-Image, the foundation model of the Z- Image family.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-26","last_updated":"2026-06-03"},{"id":"fal-ai/z-image-base-trainer","name":"Z-Image Trainer","created_by":"fal","source":"official","description":"Fast LoRA trainer for Z-Image, a super fast text-to-image model of 6B parameters developed by Tongyi-MAI.","status":"active","release_date":"2026-01-27","model_type":"other","page_url":"https://fal.run/fal-ai/z-image-base-trainer","tagline":"Fast LoRA trainer for Z-Image, a super fast text-to-image model of 6B parameters developed by Tongyi-MAI.","capabilities":{"vision":true},"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/z-image/base","name":"Z Image Base","created_by":"fal","source":"official","description":"Z-Image is the foundation model of the Z- Image family, engineered for good quality, robust generative diversity, broad stylistic coverage, and precise prompt adherence.","status":"active","release_date":"2026-01-27","model_type":"image","page_url":"https://fal.run/fal-ai/z-image/base","tagline":"Z-Image is the foundation model of the Z- Image family, engineered for good quality, robust generative diversity, broad stylistic coverage, and precise prompt adherence.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/z-image-trainer","name":"Z Image 
Trainer","created_by":"fal","source":"official","description":"Train LoRAs on Z-Image Turbo, a super fast text-to-image model of 6B parameters developed by Tongyi-MAI.","status":"active","release_date":"2025-12-03","model_type":"other","page_url":"https://fal.run/fal-ai/z-image-trainer","tagline":"Train LoRAs on Z-Image Turbo, a super fast text-to-image model of 6B parameters developed by Tongyi-MAI.","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/z-image/turbo/controlnet/lora","name":"Z Image Turbo Controlnet Lora","created_by":"fal","source":"official","description":"Generate images from text and edge, depth or pose images using custom LoRA and Z-Image Turbo, Tongyi-MAI's super-fast 6B model.","status":"active","release_date":"2025-12-07","model_type":"image","page_url":"https://fal.run/fal-ai/z-image/turbo/controlnet/lora","tagline":"Generate images from text and edge, depth or pose images using custom LoRA and Z-Image Turbo, Tongyi-MAI's super-fast 6B model.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-26","last_updated":"2026-06-03"},{"id":"fal-ai/z-image/turbo/controlnet","name":"Z Image Turbo Controlnet","created_by":"fal","source":"official","description":"Generate images from text and edge, depth or pose images using Z-Image Turbo, Tongyi-MAI's super-fast 6B model.","status":"active","release_date":"2025-12-07","model_type":"image","page_url":"https://fal.run/fal-ai/z-image/turbo/controlnet","tagline":"Generate images from text and edge, depth or pose images using Z-Image Turbo, Tongyi-MAI's super-fast 6B model.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/z-image/turbo/image-to-image/lora","name":"Z Image Turbo Image To Image 
Lora","created_by":"fal","source":"official","description":"Generate images from text and images using custom LoRA and Z-Image Turbo, Tongyi-MAI's super-fast 6B model.","status":"active","release_date":"2025-12-07","model_type":"image","page_url":"https://fal.run/fal-ai/z-image/turbo/image-to-image/lora","tagline":"Generate images from text and images using custom LoRA and Z-Image Turbo, Tongyi-MAI's super-fast 6B model.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/z-image/turbo/image-to-image","name":"Z Image Turbo Image To Image","created_by":"fal","source":"official","description":"Generate images from text and images using Z-Image Turbo, Tongyi-MAI's super-fast 6B model.","status":"active","release_date":"2025-12-07","model_type":"image","page_url":"https://fal.run/fal-ai/z-image/turbo/image-to-image","tagline":"Generate images from text and images using Z-Image Turbo, Tongyi-MAI's super-fast 6B model.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/z-image/turbo/inpaint/lora","name":"Z Image Turbo Inpaint Lora","created_by":"fal","source":"official","description":"Generate images from text, an image, a mask and custom LoRA using Z-Image Turbo, Tongyi-MAI's super-fast 6B model.","status":"active","release_date":"2025-12-18","model_type":"image","page_url":"https://fal.run/fal-ai/z-image/turbo/inpaint/lora","tagline":"Generate images from text, an image, a mask and custom LoRA using Z-Image Turbo, Tongyi-MAI's super-fast 6B model.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-26","last_updated":"2026-06-03"},{"id":"fal-ai/z-image/turbo/inpaint","name":"Z Image Turbo 
Inpaint","created_by":"fal","source":"official","description":"Generate images from text, an image and a mask using Z-Image Turbo, Tongyi-MAI's super-fast 6B model.","status":"active","release_date":"2025-12-18","model_type":"image","page_url":"https://fal.run/fal-ai/z-image/turbo/inpaint","tagline":"Generate images from text, an image and a mask using Z-Image Turbo, Tongyi-MAI's super-fast 6B model.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-06-03"},{"id":"fal-ai/z-image/turbo/lora","name":"Z Image Turbo Lora","created_by":"fal","source":"official","description":"Text-to-Image endpoint with LoRA support for Z-Image Turbo, a super fast text-to-image model of 6B parameters developed by Tongyi-MAI.","status":"active","release_date":"2025-12-01","model_type":"image","page_url":"https://fal.run/fal-ai/z-image/turbo/lora","tagline":"Text-to-Image endpoint with LoRA support for Z-Image Turbo, a super fast text-to-image model of 6B parameters developed by Tongyi-MAI.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-28","last_updated":"2026-06-03"},{"id":"fal-ai/z-image/turbo/tiling/lora","name":"Z-Image Turbo Seamless Tiling Lora","created_by":"fal","source":"official","description":"Generate seamlessly tiling photorealistic images from text using Z-Image Turbo and custom LoRA","status":"active","release_date":"2026-03-17","model_type":"image","page_url":"https://fal.run/fal-ai/z-image/turbo/tiling/lora","tagline":"Generate seamlessly tiling photorealistic images from text using Z-Image Turbo and custom LoRA","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-26","last_updated":"2026-06-03"},{"id":"fal-ai/z-image/turbo/tiling","name":"Z-Image Turbo Seamless 
Tiling","created_by":"fal","source":"official","description":"Generate seamlessly tiling photorealistic images from text using Z-Image Turbo","status":"active","release_date":"2026-03-17","model_type":"image","page_url":"https://fal.run/fal-ai/z-image/turbo/tiling","tagline":"Generate seamlessly tiling photorealistic images from text using Z-Image Turbo","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"fal-ai/z-image-turbo-trainer-v2","name":"Z Image Turbo Trainer V2","created_by":"fal","source":"official","description":"Fast LoRA trainer for Z-Image-Turbo, a super fast text-to-image model of 6B parameters developed by Tongyi-MAI.","status":"active","release_date":"2026-01-24","model_type":"other","page_url":"https://fal.run/fal-ai/z-image-turbo-trainer-v2","tagline":"Fast LoRA trainer for Z-Image-Turbo, a super fast text-to-image model of 6B parameters developed by Tongyi-MAI.","capabilities":{"vision":true},"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"fal-ai/z-image/turbo","name":"Z Image Turbo","created_by":"fal","source":"official","description":"Z-Image Turbo is a super fast text-to-image model of 6B parameters developed by Tongyi-MAI.","status":"active","release_date":"2025-11-26","model_type":"image","page_url":"https://fal.run/fal-ai/z-image/turbo","tagline":"Z-Image Turbo is a super fast text-to-image model of 6B parameters developed by Tongyi-MAI.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-30","last_updated":"2026-06-30"},{"id":"fal-ai/zonos","name":"Zonos-Audio-Clone","created_by":"fal","source":"official","description":"Clone voice of any person and speak anything in their voice using zonos' voice cloning.","status":"active","release_date":"2025-02-14","model_type":"other","page_url":"https://fal.run/fal-ai/zonos","tagline":"Clone 
voice of any person and speak anything in their voice using zonos' voice cloning.","last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"fal-ai/zonos2","name":"Zonos2 Text to Speech","created_by":"fal","source":"official","description":"Zonos2 is a text-to-speech model that clones a voice from a short sample and speaks naturally across many languages.","status":"active","release_date":"2026-06-16","model_type":"tts","page_url":"https://fal.run/fal-ai/zonos2","tagline":"Zonos2 is a text-to-speech model that clones a voice from a short sample and speaks naturally across many languages.","modalities":{"input":["text"],"output":["audio"]},"endpoints":["audio_speech"],"last_seen_at":"2026-06-16","last_updated":"2026-06-18"},{"id":"ideogram/v4/image-to-image/lora","name":"Ideogram V4.0q Image to Image LoRA","created_by":"ideogram","source":"official","description":"Ideogram V4.0q Image-to-Image LoRA applies a custom-trained LoRA on top of an input image, steering edits toward a specific style, subject, or brand identity while keeping the source composition intac","status":"active","release_date":"2026-06-10","model_type":"image","page_url":"https://fal.run/ideogram/v4/image-to-image/lora","tagline":"Ideogram V4.0q Image-to-Image LoRA applies a custom-trained LoRA on top of an input image, steering edits toward a specific style, subject, or brand identity while keeping the source composition intac","capabilities":{"streaming":true,"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-19","last_updated":"2026-06-20"},{"id":"ideogram/v4/image-to-image","name":"Ideogram V4.0q Image to Image","created_by":"ideogram","source":"official","description":"Ideogram V4.0q Image-to-Image transforms an input image with a text prompt, restyling and reworking the composition while preserving its core structure for prompt-faithful, high-fidelity 
edits.","status":"active","release_date":"2026-06-10","model_type":"image","page_url":"https://fal.run/ideogram/v4/image-to-image","tagline":"Ideogram V4.0q Image-to-Image transforms an input image with a text prompt, restyling and reworking the composition while preserving its core structure for prompt-faithful, high-fidelity edits.","capabilities":{"streaming":true,"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-19","last_updated":"2026-06-20"},{"id":"ideogram/v4/lora","name":"Ideogram V4.0q Text to Image (LoRA)","created_by":"ideogram","source":"official","description":"Generate high-quality images, posters, and logos with Ideogram's latest V4.0q using LoRA — producing crisp visuals with accurate text rendering, fine detail, and full creative control for polished, re","status":"active","release_date":"2026-06-08","model_type":"image","page_url":"https://fal.run/ideogram/v4/lora","tagline":"Generate high-quality images, posters, and logos with Ideogram's latest V4.0q using LoRA — producing crisp visuals with accurate text rendering, fine detail, and full creative control for polished, re","capabilities":{"vision":true,"streaming":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-19","last_updated":"2026-06-20"},{"id":"ideogram/v4/tiling/lora","name":"Ideogram V4.0q Tiling LoRA","created_by":"ideogram","source":"official","description":"Ideogram V4.0q Tiling LoRA produces seamless repeatable patterns guided by a custom-trained LoRA, locking a specific aesthetic or motif into tileable textures for cohesive, large-scale surface design.","status":"active","release_date":"2026-06-10","model_type":"image","page_url":"https://fal.run/ideogram/v4/tiling/lora","tagline":"Ideogram V4.0q Tiling LoRA produces seamless repeatable patterns guided by a custom-trained LoRA, locking a specific aesthetic or motif into tileable textures for cohesive, 
large-scale surface design.","capabilities":{"streaming":true,"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-19","last_updated":"2026-06-20"},{"id":"ideogram/v4/tiling","name":"Ideogram V4.0q Tiling","created_by":"ideogram","source":"official","description":"Ideogram V4.0q Tiling generates seamless, edge-matching textures and patterns that repeat infinitely in any direction, ideal for backgrounds, surfaces, and wallpapers.","status":"active","release_date":"2026-06-10","model_type":"image","page_url":"https://fal.run/ideogram/v4/tiling","tagline":"Ideogram V4.0q Tiling generates seamless, edge-matching textures and patterns that repeat infinitely in any direction, ideal for backgrounds, surfaces, and wallpapers.","capabilities":{"streaming":true,"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-19","last_updated":"2026-06-20"},{"id":"ideogram/v4/trainer","name":"Ideogram V4.0q LoRA Trainer","created_by":"ideogram","source":"official","description":"Train custom LoRAs for personalization, styles or other use cases on top of Ideogram V4.","status":"active","release_date":"2026-06-09","model_type":"other","page_url":"https://fal.run/ideogram/v4/trainer","tagline":"Train custom LoRAs for personalization, styles or other use cases on top of Ideogram V4.","last_seen_at":"2026-06-10","last_updated":"2026-06-10"},{"id":"ideogram/v4","name":"Ideogram V4.0 Text to Image","created_by":"ideogram","source":"official","description":"Generate high-quality images, posters, and logos with Ideogram's latest V4.0q — producing crisp visuals with accurate text rendering, fine detail, and full creative control for polished, ready-to-use ","status":"active","release_date":"2026-06-02","model_type":"image","page_url":"https://fal.run/ideogram/v4","tagline":"Generate high-quality images, posters, and logos with Ideogram's latest V4.0q — producing 
crisp visuals with accurate text rendering, fine detail, and full creative control for polished, ready-to-use ","capabilities":{"vision":true,"streaming":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"imagineart/imagineart-1.5-preview/text-to-image","name":"Imagineart 1.5 Preview","created_by":"imagineart","source":"official","description":"ImagineArt 1.5 text-to-image model generates high-fidelity professional-grade visuals with lifelike realism, strong aesthetics, and text that actually reads correctly.","status":"active","release_date":"2025-11-20","model_type":"image","page_url":"https://fal.run/imagineart/imagineart-1.5-preview/text-to-image","tagline":"ImagineArt 1.5 text-to-image model generates high-fidelity professional-grade visuals with lifelike realism, strong aesthetics, and text that actually reads correctly.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"imagineart/imagineart-1.5-pro-preview/text-to-image","name":"ImagineArt 1.5 Pro Preview","created_by":"imagineart","source":"official","description":"ImagineArt 1.5 Pro is an advanced text-to-image model that creates ultra-high-fidelity 4K visuals with lifelike realism, refined aesthetics, and powerful creative output suited for professional use.","status":"active","release_date":"2026-01-15","model_type":"image","page_url":"https://fal.run/imagineart/imagineart-1.5-pro-preview/text-to-image","tagline":"ImagineArt 1.5 Pro is an advanced text-to-image model that creates ultra-high-fidelity 4K visuals with lifelike realism, refined aesthetics, and powerful creative output suited for professional 
use.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"imagineart/imagineart-2.0-edit-preview/image-to-image","name":"Imagineart 2.0 Edit Preview","created_by":"imagineart","source":"official","description":"ImagineArt 2.0 Edit delivers precise prompt-guided image editing at 2K resolution, preserving fine detail and realism while accurately applying targeted changes across one or more reference images.","status":"active","release_date":"2026-05-19","model_type":"image","page_url":"https://fal.run/imagineart/imagineart-2.0-edit-preview/image-to-image","tagline":"ImagineArt 2.0 Edit delivers precise prompt-guided image editing at 2K resolution, preserving fine detail and realism while accurately applying targeted changes across one or more reference images.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-05-19","last_updated":"2026-06-03"},{"id":"imagineart/imagineart-2.0-preview/text-to-image","name":"Imagineart 2.0 Preview","created_by":"imagineart","source":"official","description":"ImagineArt 2.0 is ImagineArt's latest state-of-the-art visual reasoning text-to-image model, generating high-fidelity, professional-grade visuals with lifelike realism, cinematic effects, and strong a","status":"active","release_date":"2026-04-13","model_type":"image","page_url":"https://fal.run/imagineart/imagineart-2.0-preview/text-to-image","tagline":"ImagineArt 2.0 is ImagineArt's latest state-of-the-art visual reasoning text-to-image model, generating high-fidelity, professional-grade visuals with lifelike realism, cinematic effects, and strong a","capabilities":{"vision":true,"reasoning":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-21","last_updated":"2026-05-11"},{"id":"krea/v2/large/text-to-image","name":"Krea 2 
Large","created_by":"krea","source":"official","description":"Generate high-fidelity images from text with Krea 2 Large, supporting aspect ratio, creativity, seed controls, and optional style references.","status":"active","release_date":"2026-05-27","model_type":"image","page_url":"https://fal.run/krea/v2/large/text-to-image","tagline":"Generate high-fidelity images from text with Krea 2 Large, supporting aspect ratio, creativity, seed controls, and optional style references.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-11","last_updated":"2026-06-18"},{"id":"krea/v2/medium/text-to-image","name":"Krea 2 Medium","created_by":"krea","source":"official","description":"Generate high-quality images from text with Krea 2 Medium, supporting aspect ratio, creativity controls, seeds, and optional style references.","status":"active","release_date":"2026-05-27","model_type":"image","page_url":"https://fal.run/krea/v2/medium/text-to-image","tagline":"Generate high-quality images from text with Krea 2 Medium, supporting aspect ratio, creativity controls, seeds, and optional style references.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-05-29","last_updated":"2026-06-03"},{"id":"krea/v2/medium/turbo/text-to-image","name":"Krea 2 Medium Text to Image Turbo","created_by":"krea","source":"official","description":"Generate high-fidelity images extremely fast from text with Krea 2 Medium Turbo, supporting aspect ratio, creativity, seed controls, and optional style references.","status":"active","release_date":"2026-06-03","model_type":"image","page_url":"https://fal.run/krea/v2/medium/turbo/text-to-image","tagline":"Generate high-fidelity images extremely fast from text with Krea 2 Medium Turbo, supporting aspect ratio, creativity, seed controls, and optional style 
references.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-17","last_updated":"2026-06-18"},{"id":"luma/agent/ray/v3.2/image-to-video","name":"Luma Ray 3.2 Image to Video","created_by":"luma","source":"official","description":"Luma Ray 3.2 animates a source image into cinematic motion guided by a text prompt, preserving the starting frame's look while controlling resolution, duration, and seamless looping.","status":"active","release_date":"2026-06-09","model_type":"video","page_url":"https://fal.run/luma/agent/ray/v3.2/image-to-video","tagline":"Luma Ray 3.2 animates a source image into cinematic motion guided by a text prompt, preserving the starting frame's look while controlling resolution, duration, and seamless looping.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-15","last_updated":"2026-06-18"},{"id":"luma/agent/ray/v3.2/reframe","name":"Luma Ray 3.2 Reframe","created_by":"luma","source":"official","description":"Luma Ray 3.2 reframes an existing video into a new aspect ratio guided by a text prompt, preserving the original footage frame-for-frame while controlling resolution and outpainting the surrounding ca","status":"active","release_date":"2026-06-11","model_type":"other","page_url":"https://fal.run/luma/agent/ray/v3.2/reframe","tagline":"Luma Ray 3.2 reframes an existing video into a new aspect ratio guided by a text prompt, preserving the original footage frame-for-frame while controlling resolution and outpainting the surrounding ca","last_seen_at":"2026-06-15","last_updated":"2026-06-18"},{"id":"luma/agent/ray/v3.2/text-to-video","name":"Luma Ray 3.2 Text to Video","created_by":"luma","source":"official","description":"Luma Ray 3.2 generates cinematic video from a text prompt, with control over resolution, duration, and seamless looping, plus reference images to lock in 
subject and style.","status":"active","release_date":"2026-06-09","model_type":"video","page_url":"https://fal.run/luma/agent/ray/v3.2/text-to-video","tagline":"Luma Ray 3.2 generates cinematic video from a text prompt, with control over resolution, duration, and seamless looping, plus reference images to lock in subject and style.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-15","last_updated":"2026-06-18"},{"id":"luma/agent/ray/v3.2/video-to-video","name":"Luma Ray 3.2 Video to Video","created_by":"luma","source":"official","description":"Luma Ray 3.2 re-renders an existing video into new cinematic motion guided by a text prompt, preserving the source's look and movement while controlling resolution, duration, and HDR.","status":"active","release_date":"2026-06-11","model_type":"other","page_url":"https://fal.run/luma/agent/ray/v3.2/video-to-video","tagline":"Luma Ray 3.2 re-renders an existing video into new cinematic motion guided by a text prompt, preserving the source's look and movement while controlling resolution, duration, and HDR.","last_seen_at":"2026-06-15","last_updated":"2026-06-18"},{"id":"luma/agent/uni-1/v1/edit","name":"Luma Uni-1 Edit","created_by":"luma","source":"official","description":"Luma Uni-1 Edit reworks a source image from a text instruction, preserving the original composition while applying style changes and following optional reference images to steer the result.","status":"active","release_date":"2026-06-09","model_type":"image","page_url":"https://fal.run/luma/agent/uni-1/v1/edit","tagline":"Luma Uni-1 Edit reworks a source image from a text instruction, preserving the original composition while applying style changes and following optional reference images to steer the 
result.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-15","last_updated":"2026-06-18"},{"id":"luma/agent/uni-1/v1/max/edit","name":"Luma Uni-1 Edit Max","created_by":"luma","source":"official","description":"Luma Uni-1 Max Edit applies text-guided edits to a source image at maximum fidelity, holding the original structure while honoring reference images for precise, high-detail revisions.","status":"active","release_date":"2026-06-09","model_type":"image","page_url":"https://fal.run/luma/agent/uni-1/v1/max/edit","tagline":"Luma Uni-1 Max Edit applies text-guided edits to a source image at maximum fidelity, holding the original structure while honoring reference images for precise, high-detail revisions.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-15","last_updated":"2026-06-18"},{"id":"luma/agent/uni-1/v1/max","name":"Luma Uni-1 Text to Image Max","created_by":"luma","source":"official","description":"Luma Uni-1 Max generates a single image at the model's highest fidelity, delivering richer detail and stronger prompt adherence than the base tier for hero-quality stills.","status":"active","release_date":"2026-06-09","model_type":"image","page_url":"https://fal.run/luma/agent/uni-1/v1/max","tagline":"Luma Uni-1 Max generates a single image at the model's highest fidelity, delivering richer detail and stronger prompt adherence than the base tier for hero-quality stills.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-15","last_updated":"2026-06-18"},{"id":"luma/agent/uni-1/v1/text-to-image","name":"Luma Uni-1 Text to Image","created_by":"luma","source":"official","description":"Luma Uni-1 turns a text prompt into a single high-fidelity image, with control over aspect ratio and visual style, plus optional 
web-sourced and reference-image guidance for sharper grounding.","status":"active","release_date":"2026-06-09","model_type":"image","page_url":"https://fal.run/luma/agent/uni-1/v1/text-to-image","tagline":"Luma Uni-1 turns a text prompt into a single high-fidelity image, with control over aspect ratio and visual style, plus optional web-sourced and reference-image guidance for sharper grounding.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-15","last_updated":"2026-06-18"},{"id":"microsoft/mai-image-2.5/edit","name":"Mai Image 2.5","created_by":"microsoft","source":"official","description":"MAI-Image-2.5 is Microsoft's photorealistic image generation and editing model that turns text prompts or uploaded images into high-quality, design-ready visuals with fine-grained, pixel-level control","status":"active","release_date":"2026-06-03","model_type":"image","page_url":"https://fal.run/microsoft/mai-image-2.5/edit","tagline":"MAI-Image-2.5 is Microsoft's photorealistic image generation and editing model that turns text prompts or uploaded images into high-quality, design-ready visuals with fine-grained, pixel-level control","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-04","last_updated":"2026-06-10"},{"id":"microsoft/mai-image-2.5","name":"Mai Image 2.5 Text to Image","created_by":"microsoft","source":"official","description":"MAI-Image-2.5 is Microsoft's photorealistic image generation and editing model that turns text prompts or uploaded images into high-quality, design-ready visuals with fine-grained, pixel-level control","status":"active","release_date":"2026-06-02","model_type":"image","page_url":"https://fal.run/microsoft/mai-image-2.5","tagline":"MAI-Image-2.5 is Microsoft's photorealistic image generation and editing model that turns text prompts or uploaded images into high-quality, 
design-ready visuals with fine-grained, pixel-level control","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"mirelo-ai/sfx-v1/video-to-audio","name":"Mirelo SFX","created_by":"mirelo-ai","source":"official","description":"Generate synced sounds for any video, and return the new sound track (like MMAudio)","status":"active","release_date":"2025-08-15","model_type":"other","page_url":"https://fal.run/mirelo-ai/sfx-v1/video-to-audio","tagline":"Generate synced sounds for any video, and return the new sound track (like MMAudio)","last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"mirelo-ai/sfx-v1/video-to-video","name":"Mirelo SFX","created_by":"mirelo-ai","source":"official","description":"Generate synced sounds for any video, and return it with its new sound track (like MMAudio)\n","status":"active","release_date":"2025-08-14","model_type":"other","page_url":"https://fal.run/mirelo-ai/sfx-v1/video-to-video","tagline":"Generate synced sounds for any video, and return it with its new sound track (like MMAudio)\n","last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"mirelo-ai/sfx-v1.5/video-to-audio","name":"Mirelo SFX V1.5","created_by":"mirelo-ai","source":"official","description":"Generate synced sounds for any video, and return the new sound track (like MMAudio)","status":"active","release_date":"2025-10-15","model_type":"other","page_url":"https://fal.run/mirelo-ai/sfx-v1.5/video-to-audio","tagline":"Generate synced sounds for any video, and return the new sound track (like MMAudio)","last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"mirelo-ai/sfx-v1.5/video-to-video","name":"Mirelo SFX V1.5","created_by":"mirelo-ai","source":"official","description":"Generate synced sounds for any video, and return it with its new sound track (like 
MMAudio)","status":"active","release_date":"2025-10-15","model_type":"other","page_url":"https://fal.run/mirelo-ai/sfx-v1.5/video-to-video","tagline":"Generate synced sounds for any video, and return it with its new sound track (like MMAudio)","last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"mirelo-ai/sfx1.6/extend-audio","name":"Mirelo SFX1.6","created_by":"mirelo-ai","source":"official","description":"Extend any sound effect with seamless, natural tails.","status":"active","release_date":"2026-05-18","model_type":"other","page_url":"https://fal.run/mirelo-ai/sfx1.6/extend-audio","tagline":"Extend any sound effect with seamless, natural tails.","last_seen_at":"2026-05-19","last_updated":"2026-06-03"},{"id":"mirelo-ai/sfx1.6/inpaint-audio","name":"Mirelo SFX1.6","created_by":"mirelo-ai","source":"official","description":"Erase and replace any moment in your audio with AI-driven precision.","status":"active","release_date":"2026-05-18","model_type":"other","page_url":"https://fal.run/mirelo-ai/sfx1.6/inpaint-audio","tagline":"Erase and replace any moment in your audio with AI-driven precision.","last_seen_at":"2026-05-19","last_updated":"2026-06-03"},{"id":"mirelo-ai/sfx1.6/text-to-audio","name":"Mirelo SFX1.6","created_by":"mirelo-ai","source":"official","description":"Generate ambient sounds for any text prompt.","status":"active","release_date":"2026-05-15","model_type":"other","page_url":"https://fal.run/mirelo-ai/sfx1.6/text-to-audio","tagline":"Generate ambient sounds for any text prompt.","last_seen_at":"2026-05-19","last_updated":"2026-06-03"},{"id":"mirelo-ai/sfx1.6/video-to-video","name":"Mirelo SFX1.6","created_by":"mirelo-ai","source":"official","description":"Generate synced sounds for any video, and return it with its new sound track (like MMAudio).","status":"active","release_date":"2026-05-18","model_type":"other","page_url":"https://fal.run/mirelo-ai/sfx1.6/video-to-video","tagline":"Generate synced sounds for any video, and return it 
with its new sound track (like MMAudio).","last_seen_at":"2026-05-19","last_updated":"2026-06-03"},{"id":"moonvalley/marey/i2v","name":"Marey Realism V1.5","created_by":"moonvalley","source":"official","description":"Generate a video starting from an image as the first frame with Marey, a generative video model trained exclusively on fully licensed data.","status":"active","release_date":"2025-08-14","model_type":"video","page_url":"https://fal.run/moonvalley/marey/i2v","tagline":"Generate a video starting from an image as the first frame with Marey, a generative video model trained exclusively on fully licensed data.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"moonvalley/marey/motion-transfer","name":"Marey Realism V1.5","created_by":"moonvalley","source":"official","description":"Pull motion from a reference video and apply it to new subjects or scenes.","status":"active","release_date":"2025-08-14","model_type":"other","page_url":"https://fal.run/moonvalley/marey/motion-transfer","tagline":"Pull motion from a reference video and apply it to new subjects or scenes.","last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"moonvalley/marey/pose-transfer","name":"Marey Realism V1.5","created_by":"moonvalley","source":"official","description":"Ideal for matching human movement.","status":"active","release_date":"2025-08-14","model_type":"other","page_url":"https://fal.run/moonvalley/marey/pose-transfer","tagline":"Ideal for matching human movement.","last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"moonvalley/marey/t2v","name":"Marey Realism V1.5","created_by":"moonvalley","source":"official","description":"Generate a video from a text prompt with Marey, a generative video model trained exclusively on fully licensed 
data.","status":"active","release_date":"2025-08-14","model_type":"video","page_url":"https://fal.run/moonvalley/marey/t2v","tagline":"Generate a video from a text prompt with Marey, a generative video model trained exclusively on fully licensed data.","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"nvidia/cosmos-3-super/image-to-video","name":"Cosmos 3 Super Image to Video","created_by":"nvidia","source":"official","description":"Cosmos3 is a collection of Omnimodal world models capable of generating dynamic, high-quality video, image, audio, and action commands from combinations of text, image, video, and action trajectory in","status":"active","release_date":"2026-06-01","model_type":"video","page_url":"https://fal.run/nvidia/cosmos-3-super/image-to-video","tagline":"Cosmos3 is a collection of Omnimodal world models capable of generating dynamic, high-quality video, image, audio, and action commands from combinations of text, image, video, and action trajectory in","capabilities":{"vision":true},"modalities":{"input":["text","image","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-02","last_updated":"2026-06-03"},{"id":"nvidia/cosmos-3-super/text-to-image","name":"Cosmos 3 Super","created_by":"nvidia","source":"official","description":"Cosmos3 is a collection of Omnimodal world models capable of generating dynamic, high-quality video, image, audio, and action commands from combinations of text, image, video, and action trajectory in","status":"active","release_date":"2026-06-01","model_type":"image","page_url":"https://fal.run/nvidia/cosmos-3-super/text-to-image","tagline":"Cosmos3 is a collection of Omnimodal world models capable of generating dynamic, high-quality video, image, audio, and action commands from combinations of text, image, video, and action trajectory 
in","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-02","last_updated":"2026-06-03"},{"id":"nvidia/nemotron-3-nano-omni/audio","name":"Nemotron 3 Nano Omni","created_by":"nvidia","source":"official","description":"Audio reasoning variant of NVIDIA's Nemotron 3 Nano Omni.","status":"active","release_date":"2026-04-27","model_type":"transcription","page_url":"https://fal.run/nvidia/nemotron-3-nano-omni/audio","tagline":"Audio reasoning variant of NVIDIA's Nemotron 3 Nano Omni.","capabilities":{"reasoning":true},"modalities":{"input":["audio"],"output":["text"]},"endpoints":["audio_transcriptions"],"last_seen_at":"2026-04-30","last_updated":"2026-05-11"},{"id":"nvidia/nemotron-3-nano-omni/video","name":"Nemotron 3 Nano Omni","created_by":"nvidia","source":"official","description":"Video reasoning variant of NVIDIA's Nemotron 3 Nano Omni.","status":"active","release_date":"2026-04-27","model_type":"other","page_url":"https://fal.run/nvidia/nemotron-3-nano-omni/video","tagline":"Video reasoning variant of NVIDIA's Nemotron 3 Nano Omni.","capabilities":{"reasoning":true},"last_seen_at":"2026-05-13","last_updated":"2026-06-03"},{"id":"nvidia/nemotron-3-nano-omni/vision","name":"Nemotron 3 Nano Omni","created_by":"nvidia","source":"official","description":"Vision reasoning variant of NVIDIA's Nemotron 3 Nano Omni.","status":"active","release_date":"2026-04-27","model_type":"other","page_url":"https://fal.run/nvidia/nemotron-3-nano-omni/vision","tagline":"Vision reasoning variant of NVIDIA's Nemotron 3 Nano Omni.","capabilities":{"vision":true,"reasoning":true},"last_seen_at":"2026-04-30","last_updated":"2026-05-11"},{"id":"nvidia/nemotron-3-nano-omni","name":"Nemotron 3 Nano Omni","created_by":"nvidia","source":"official","description":"Open, efficient reasoning model from 
NVIDIA.","status":"active","release_date":"2026-04-27","model_type":"other","page_url":"https://fal.run/nvidia/nemotron-3-nano-omni","tagline":"Open, efficient reasoning model from NVIDIA.","capabilities":{"reasoning":true},"last_seen_at":"2026-04-30","last_updated":"2026-05-11"},{"id":"nvidia/nemotron-asr-multilingual/asr","name":"Nemotron Asr Multilingual","created_by":"nvidia","source":"official","description":"Nemotron-ASR-Streaming is a multi lingual, streaming Automatic Speech Recognition (ASR) engineered to deliver high-quality multi lingual transcription across both low-latency streaming and high-throug","status":"active","release_date":"2026-06-01","model_type":"transcription","page_url":"https://fal.run/nvidia/nemotron-asr-multilingual/asr","tagline":"Nemotron-ASR-Streaming is a multi lingual, streaming Automatic Speech Recognition (ASR) engineered to deliver high-quality multi lingual transcription across both low-latency streaming and high-throug","capabilities":{"streaming":true},"modalities":{"input":["audio"],"output":["text"]},"endpoints":["audio_transcriptions"],"last_seen_at":"2026-06-10","last_updated":"2026-06-18"},{"id":"openai/gpt-image-2/edit","name":"GPT Image 2 API","created_by":"openai","source":"official","family":"gpt-image-2","description":"GPT Image 2, OpenAI's latest image model, is capable of making fine-grained, detailed edits to images.","status":"active","release_date":"2026-04-20","model_type":"image","page_url":"https://fal.run/openai/gpt-image-2/edit","tagline":"GPT Image 2, OpenAI's latest image model, is capable of making fine-grained, detailed edits to images.","capabilities":{"streaming":true,"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-02","last_updated":"2026-06-03"},{"id":"openai/gpt-image-2","name":"GPT Image 2 API","created_by":"openai","source":"official","family":"gpt-image-2","description":"GPT Image 2, OpenAI's latest image model, is 
capable of creating extremely detailed images with fine typography.","status":"active","release_date":"2026-04-20","model_type":"image","page_url":"https://fal.run/openai/gpt-image-2","tagline":"GPT Image 2, OpenAI's latest image model, is capable of creating extremely detailed images with fine typography.","capabilities":{"streaming":true,"vision":true,"tool_call":false,"structured_output":false,"json_mode":false,"fine_tuning":false,"reasoning":false,"batch":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-11","last_updated":"2026-06-18","license":"proprietary","open_weight":false},{"id":"openrouter/router/audio","name":"OpenRouter [Audio]","created_by":"openrouter","source":"official","description":" Run any audio capable LLM with fal.","status":"active","release_date":"2025-12-22","model_type":"other","page_url":"https://fal.run/openrouter/router/audio","tagline":" Run any audio capable LLM with fal.","last_seen_at":"2026-05-06","last_updated":"2026-05-11"},{"id":"openrouter/router/enterprise","name":"OpenRouter [Enterprise]","created_by":"openrouter","source":"official","description":"Run any LLM (Large Language Model) with fal, powered by OpenRouter.","status":"active","release_date":"2025-12-22","model_type":"other","page_url":"https://fal.run/openrouter/router/enterprise","tagline":"Run any LLM (Large Language Model) with fal, powered by OpenRouter.","capabilities":{"streaming":true},"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"openrouter/router/openai/v1/chat/completions","name":"OpenRouter Chat Completions [OpenAI Compatible]","created_by":"openrouter","source":"official","description":"OpenAI-compatible chat completions API.","status":"active","release_date":"2025-11-12","model_type":"other","page_url":"https://fal.run/openrouter/router/openai/v1/chat/completions","tagline":"OpenAI-compatible chat completions 
API.","last_seen_at":"2026-05-06","last_updated":"2026-05-11"},{"id":"openrouter/router/openai/v1/embeddings","name":"OpenRouter Embeddings [OpenAI Compatible]","created_by":"openrouter","source":"official","description":"Generate text embeddings using OpenAI-compatible API.","status":"active","release_date":"2025-11-12","model_type":"other","page_url":"https://fal.run/openrouter/router/openai/v1/embeddings","tagline":"Generate text embeddings using OpenAI-compatible API.","last_seen_at":"2026-05-06","last_updated":"2026-05-11"},{"id":"openrouter/router/openai/v1/responses","name":"OpenRouter Responses [OpenAI Compatible]","created_by":"openrouter","source":"official","description":"The OpenRouter Responses API with fal, powered by OpenRouter, provides unified access to a wide range of large language models - including GPT, Claude, Gemini, and many others through a single API int","status":"active","release_date":"2025-11-13","model_type":"other","page_url":"https://fal.run/openrouter/router/openai/v1/responses","tagline":"The OpenRouter Responses API with fal, powered by OpenRouter, provides unified access to a wide range of large language models - including GPT, Claude, Gemini, and many others through a single API int","last_seen_at":"2026-05-06","last_updated":"2026-05-11"},{"id":"openrouter/router/video/enterprise","name":"OpenRouter [Video][Enterprise]","created_by":"openrouter","source":"official","description":"Run any VLM (Video Language Model) with fal, powered by OpenRouter.","status":"active","release_date":"2026-01-13","model_type":"other","page_url":"https://fal.run/openrouter/router/video/enterprise","tagline":"Run any VLM (Video Language Model) with fal, powered by OpenRouter.","capabilities":{"streaming":true},"last_seen_at":"2026-05-06","last_updated":"2026-05-11"},{"id":"openrouter/router/video","name":"OpenRouter [Video]","created_by":"openrouter","source":"official","description":"Run any video-capable LLM with 
fal.","status":"active","release_date":"2026-01-13","model_type":"other","page_url":"https://fal.run/openrouter/router/video","tagline":"Run any video-capable LLM with fal.","capabilities":{"streaming":true},"last_seen_at":"2026-05-06","last_updated":"2026-05-11"},{"id":"openrouter/router/vision","name":"OpenRouter [Vision]","created_by":"openrouter","source":"official","description":"Run any Vision Language Model with fal.","status":"active","release_date":"2025-11-12","model_type":"other","page_url":"https://fal.run/openrouter/router/vision","tagline":"Run any Vision Language Model with fal.","capabilities":{"streaming":true,"vision":true},"last_seen_at":"2026-06-26","last_updated":"2026-06-29"},{"id":"openrouter/router","name":"OpenRouter","created_by":"openrouter","source":"official","description":"Run any LLM with fal.","status":"active","release_date":"2025-11-12","model_type":"other","page_url":"https://fal.run/openrouter/router","tagline":"Run any LLM with fal.","capabilities":{"streaming":true,"reasoning":true,"structured_output":true,"json_mode":true},"last_seen_at":"2026-05-06","last_updated":"2026-05-11"},{"id":"perceptron/isaac-01/openai/v1/chat/completions","name":"Isaac 0.1 [OpenAI Compatible Endpoint]","created_by":"perceptron","source":"official","description":"OpenAI spec compatible endpoint of Isaac-01 which is a multimodal vision-language model from Perceptron for various vision language tasks.","status":"active","release_date":"2025-09-17","model_type":"other","page_url":"https://fal.run/perceptron/isaac-01/openai/v1/chat/completions","tagline":"OpenAI spec compatible endpoint of Isaac-01 which is a multimodal vision-language model from Perceptron for various vision language tasks.","capabilities":{"vision":true},"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"perceptron/isaac-01","name":"Isaac 0.1","created_by":"perceptron","source":"official","description":"Isaac-01 is a multimodal vision-language model from Perceptron for 
various vision language tasks.","status":"active","release_date":"2025-09-17","model_type":"other","page_url":"https://fal.run/perceptron/isaac-01","tagline":"Isaac-01 is a multimodal vision-language model from Perceptron for various vision language tasks.","capabilities":{"streaming":true,"vision":true},"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"pixelcut/background-removal","name":"Pixelcut Background Remover","created_by":"pixelcut","source":"official","description":"Pixelcut’s Background Remover enables fast, ultra high-quality removal of backgrounds from images.","status":"active","release_date":"2026-03-04","model_type":"image","page_url":"https://fal.run/pixelcut/background-removal","tagline":"Pixelcut’s Background Remover enables fast, ultra high-quality removal of backgrounds from images.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-06-11","last_updated":"2026-06-18"},{"id":"pixelcut/video-background-removal","name":"Pixelcut Video Background Removal","created_by":"pixelcut","source":"official","description":"Pixelcut's Video Background Remover is an AI segmentation model that erases backgrounds frame by frame, with seamless temporal consistency.","status":"active","release_date":"2026-06-11","model_type":"other","page_url":"https://fal.run/pixelcut/video-background-removal","tagline":"Pixelcut's Video Background Remover is an AI segmentation model that erases backgrounds frame by frame, with seamless temporal consistency.","last_seen_at":"2026-06-12","last_updated":"2026-06-18"},{"id":"resemble-ai/chatterboxhd/speech-to-speech","name":"Chatterboxhd","created_by":"resemble-ai","source":"official","description":"Transform voices using Resemble AI's Chatterbox.","status":"active","release_date":"2025-06-02","model_type":"other","page_url":"https://fal.run/resemble-ai/chatterboxhd/speech-to-speech","tagline":"Transform voices using Resemble AI's 
Chatterbox.","last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"resemble-ai/chatterboxhd/text-to-speech","name":"Chatterboxhd","created_by":"resemble-ai","source":"official","description":"Generate expressive, natural speech with Resemble AI's Chatterbox.","status":"active","release_date":"2025-06-02","model_type":"tts","page_url":"https://fal.run/resemble-ai/chatterboxhd/text-to-speech","tagline":"Generate expressive, natural speech with Resemble AI's Chatterbox.","modalities":{"input":["text"],"output":["audio"]},"endpoints":["audio_speech"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"rundiffusion-fal/juggernaut-flux/base/image-to-image","name":"Juggernaut Flux Base","created_by":"rundiffusion-fal","source":"official","description":"Juggernaut Base Flux by RunDiffusion is a drop-in replacement for Flux [Dev] that delivers sharper details, richer colors, and enhanced realism, while instantly boosting LoRAs and LyCORIS with full co","status":"active","release_date":"2025-03-05","model_type":"image","page_url":"https://fal.run/rundiffusion-fal/juggernaut-flux/base/image-to-image","tagline":"Juggernaut Base Flux by RunDiffusion is a drop-in replacement for Flux [Dev] that delivers sharper details, richer colors, and enhanced realism, while instantly boosting LoRAs and LyCORIS with full co","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"rundiffusion-fal/juggernaut-flux/base","name":"Juggernaut Flux Base","created_by":"rundiffusion-fal","source":"official","description":"Juggernaut Base Flux by RunDiffusion is a drop-in replacement for Flux [Dev] that delivers sharper details, richer colors, and enhanced realism, while instantly boosting LoRAs and LyCORIS with full 
co","status":"active","release_date":"2025-03-05","model_type":"image","page_url":"https://fal.run/rundiffusion-fal/juggernaut-flux/base","tagline":"Juggernaut Base Flux by RunDiffusion is a drop-in replacement for Flux [Dev] that delivers sharper details, richer colors, and enhanced realism, while instantly boosting LoRAs and LyCORIS with full co","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"rundiffusion-fal/juggernaut-flux/lightning","name":"Juggernaut Flux Lightning","created_by":"rundiffusion-fal","source":"official","description":"Juggernaut Lightning Flux by RunDiffusion provides blazing-fast, high-quality images rendered at five times the speed of Flux.","status":"active","release_date":"2025-03-05","model_type":"image","page_url":"https://fal.run/rundiffusion-fal/juggernaut-flux/lightning","tagline":"Juggernaut Lightning Flux by RunDiffusion provides blazing-fast, high-quality images rendered at five times the speed of Flux.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"rundiffusion-fal/juggernaut-flux-lora/inpainting","name":"Juggernaut Flux Lora","created_by":"rundiffusion-fal","source":"official","description":"Juggernaut Base Flux LoRA Inpainting by RunDiffusion is a drop-in replacement for Flux [Dev] inpainting that delivers sharper details, richer colors, and enhanced realism to all your LoRAs and LyCORIS","status":"active","release_date":"2025-04-21","model_type":"image","page_url":"https://fal.run/rundiffusion-fal/juggernaut-flux-lora/inpainting","tagline":"Juggernaut Base Flux LoRA Inpainting by RunDiffusion is a drop-in replacement for Flux [Dev] inpainting that delivers sharper details, richer colors, and enhanced realism to all your LoRAs and 
LyCORIS","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"rundiffusion-fal/juggernaut-flux-lora","name":"Juggernaut Flux Base LoRA","created_by":"rundiffusion-fal","source":"official","description":"Juggernaut Base Flux LoRA by RunDiffusion is a drop-in replacement for Flux [Dev] that delivers sharper details, richer colors, and enhanced realism to all your LoRAs and LyCORIS with full compatibili","status":"active","release_date":"2025-03-05","model_type":"image","page_url":"https://fal.run/rundiffusion-fal/juggernaut-flux-lora","tagline":"Juggernaut Base Flux LoRA by RunDiffusion is a drop-in replacement for Flux [Dev] that delivers sharper details, richer colors, and enhanced realism to all your LoRAs and LyCORIS with full compatibili","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"rundiffusion-fal/juggernaut-flux/pro/image-to-image","name":"Juggernaut Flux Pro","created_by":"rundiffusion-fal","source":"official","description":"Juggernaut Pro Flux by RunDiffusion is the flagship Juggernaut model rivaling some of the most advanced image models available, often surpassing them in realism.","status":"active","release_date":"2025-03-05","model_type":"image","page_url":"https://fal.run/rundiffusion-fal/juggernaut-flux/pro/image-to-image","tagline":"Juggernaut Pro Flux by RunDiffusion is the flagship Juggernaut model rivaling some of the most advanced image models available, often surpassing them in realism.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"rundiffusion-fal/juggernaut-flux/pro","name":"Juggernaut Flux 
Pro","created_by":"rundiffusion-fal","source":"official","description":"Juggernaut Pro Flux by RunDiffusion is the flagship Juggernaut model rivaling some of the most advanced image models available, often surpassing them in realism.","status":"active","release_date":"2025-03-05","model_type":"image","page_url":"https://fal.run/rundiffusion-fal/juggernaut-flux/pro","tagline":"Juggernaut Pro Flux by RunDiffusion is the flagship Juggernaut model rivaling some of the most advanced image models available, often surpassing them in realism.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"rundiffusion-fal/rundiffusion-photo-flux","name":"Rundiffusion Photo Flux","created_by":"rundiffusion-fal","source":"official","description":"RunDiffusion Photo Flux provides insane realism.","status":"active","release_date":"2025-03-05","model_type":"image","page_url":"https://fal.run/rundiffusion-fal/rundiffusion-photo-flux","tagline":"RunDiffusion Photo Flux provides insane realism.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"smoretalk-ai/rembg-enhance","name":"Rembg Enhance (Remove Background Enhance)","created_by":"smoretalk-ai","source":"official","description":"Rembg-enhance is optimized for 2D vector images, 3D graphics, and photos by leveraging matting technology.","status":"active","release_date":"2025-05-09","model_type":"image","page_url":"https://fal.run/smoretalk-ai/rembg-enhance","tagline":"Rembg-enhance is optimized for 2D vector images, 3D graphics, and photos by leveraging matting technology.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-05-13","last_updated":"2026-06-03"},{"id":"sonauto/v2/extend","name":"Sonauto 
V2","created_by":"sonauto","source":"official","description":"Extend an existing song","status":"active","release_date":"2025-08-23","model_type":"other","page_url":"https://fal.run/sonauto/v2/extend","tagline":"Extend an existing song","last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"sonauto/v2/inpaint","name":"Sonauto V2","created_by":"sonauto","source":"official","description":"Replace sections of an existing audio with newly generated content","status":"active","release_date":"2025-08-23","model_type":"other","page_url":"https://fal.run/sonauto/v2/inpaint","tagline":"Replace sections of an existing audio with newly generated content","last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"sonauto/v2/text-to-music","name":"Sonauto V2","created_by":"sonauto","source":"official","description":"Create full songs in any style","status":"active","release_date":"2025-08-23","model_type":"other","page_url":"https://fal.run/sonauto/v2/text-to-music","tagline":"Create full songs in any style","last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"sonilo/v1.1/text-to-music","name":"Sonilo V1.1 Text to Music","created_by":"sonilo","source":"official","description":"Generates production-ready music from a single text prompt, with full control over style, mood, instrumentation, and exact duration.","status":"active","release_date":"2026-06-03","model_type":"other","page_url":"https://fal.run/sonilo/v1.1/text-to-music","tagline":"Generates production-ready music from a single text prompt, with full control over style, mood, instrumentation, and exact duration.","last_seen_at":"2026-06-03","last_updated":"2026-06-10"},{"id":"sonilo/v1.1/video-to-music","name":"V1.1","created_by":"sonilo","source":"official","description":"Analyzes your video's pacing, mood, and timing to generate a frame-synced, commercial-ready soundtrack in 
seconds","status":"active","release_date":"2026-06-03","model_type":"other","page_url":"https://fal.run/sonilo/v1.1/video-to-music","tagline":"Analyzes your video's pacing, mood, and timing to generate a frame-synced, commercial-ready soundtrack in seconds","last_seen_at":"2026-06-03","last_updated":"2026-06-10"},{"id":"tripo3d/h3.1/image-to-3d","name":"Tripo H3.1 Image to 3D","created_by":"tripo3d","source":"official","description":"Generate high-quality 3D models from a single image using Tripo H3.1.","status":"active","release_date":"2026-04-07","model_type":"other","page_url":"https://fal.run/tripo3d/h3.1/image-to-3d","tagline":"Generate high-quality 3D models from a single image using Tripo H3.1.","capabilities":{"vision":true},"last_seen_at":"2026-05-07","last_updated":"2026-05-11"},{"id":"tripo3d/h3.1/multiview-to-3d","name":"Tripo H3.1 Multiview to 3D","created_by":"tripo3d","source":"official","description":"Generate 3D models from multiple view images using Tripo H3.1.","status":"active","release_date":"2026-04-07","model_type":"other","page_url":"https://fal.run/tripo3d/h3.1/multiview-to-3d","tagline":"Generate 3D models from multiple view images using Tripo H3.1.","capabilities":{"vision":true},"last_seen_at":"2026-05-07","last_updated":"2026-05-11"},{"id":"tripo3d/h3.1/text-to-3d","name":"Tripo H3.1 Text to 3D","created_by":"tripo3d","source":"official","description":"Generate 3D models from text descriptions using Tripo H3.1.","status":"active","release_date":"2026-04-07","model_type":"other","page_url":"https://fal.run/tripo3d/h3.1/text-to-3d","tagline":"Generate 3D models from text descriptions using Tripo H3.1.","last_seen_at":"2026-05-07","last_updated":"2026-05-11"},{"id":"tripo3d/p1/image-to-3d","name":"Tripo P1 Image to 3D","created_by":"tripo3d","source":"official","description":"Generate 3D models from a single image using Tripo 
P1.","status":"active","release_date":"2026-04-07","model_type":"other","page_url":"https://fal.run/tripo3d/p1/image-to-3d","tagline":"Generate 3D models from a single image using Tripo P1.","capabilities":{"vision":true},"last_seen_at":"2026-05-07","last_updated":"2026-05-11"},{"id":"tripo3d/p1/text-to-3d","name":"Tripo P1 Text to 3D","created_by":"tripo3d","source":"official","description":"Generate 3D models from text descriptions using Tripo P1.","status":"active","release_date":"2026-04-07","model_type":"other","page_url":"https://fal.run/tripo3d/p1/text-to-3d","tagline":"Generate 3D models from text descriptions using Tripo P1.","last_seen_at":"2026-05-07","last_updated":"2026-05-11"},{"id":"tripo3d/tripo/v2.5/image-to-3d","name":"Tripo3D","created_by":"tripo3d","source":"official","description":"State of the art Image to 3D Object generation.","status":"active","release_date":"2025-04-25","model_type":"other","page_url":"https://fal.run/tripo3d/tripo/v2.5/image-to-3d","tagline":"State of the art Image to 3D Object generation.","capabilities":{"vision":true},"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"tripo3d/tripo/v2.5/multiview-to-3d","name":"Tripo3D","created_by":"tripo3d","source":"official","description":"State of the art Multiview to 3D Object generation.","status":"active","release_date":"2025-06-18","model_type":"other","page_url":"https://fal.run/tripo3d/tripo/v2.5/multiview-to-3d","tagline":"State of the art Multiview to 3D Object generation.","capabilities":{"vision":true},"last_seen_at":"2026-06-24","last_updated":"2026-06-29"},{"id":"tripo3d/triposplat","name":"Triposplat","created_by":"tripo3d","source":"official","description":"TripoSplat is an open-source model from TripoAI / VAST AI Research that converts a single 2D image into high-quality 3D Gaussians using a novel learned density-control 
approach","status":"active","release_date":"2026-06-03","model_type":"other","page_url":"https://fal.run/tripo3d/triposplat","tagline":"TripoSplat is an open-source model from TripoAI / VAST AI Research that converts a single 2D image into high-quality 3D Gaussians using a novel learned density-control approach","capabilities":{"vision":true},"last_seen_at":"2026-06-03","last_updated":"2026-06-10"},{"id":"veed/avatars/audio-to-video","name":"Avatars","created_by":"veed","source":"official","description":"Generate high-quality videos with UGC-like avatars from audio","status":"active","release_date":"2025-05-28","model_type":"other","page_url":"https://fal.run/veed/avatars/audio-to-video","tagline":"Generate high-quality videos with UGC-like avatars from audio","last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"veed/avatars/text-to-video","name":"Avatars","created_by":"veed","source":"official","description":"Generate high-quality videos with UGC-like avatars from text","status":"active","release_date":"2025-05-28","model_type":"video","page_url":"https://fal.run/veed/avatars/text-to-video","tagline":"Generate high-quality videos with UGC-like avatars from text","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"veed/fabric-1.0/fast","name":"Fabric 1.0 Fast","created_by":"veed","source":"official","description":"VEED Fabric 1.0 is an image-to-video API that turns any image into a talking video","status":"active","release_date":"2025-10-01","model_type":"video","page_url":"https://fal.run/veed/fabric-1.0/fast","tagline":"VEED Fabric 1.0 is an image-to-video API that turns any image into a talking video","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-23","last_updated":"2026-05-11"},{"id":"veed/fabric-1.0/text","name":"Fabric 
1.0","created_by":"veed","source":"official","description":"VEED Fabric 1.0 text-to-video API","status":"active","release_date":"2025-12-12","model_type":"video","page_url":"https://fal.run/veed/fabric-1.0/text","tagline":"VEED Fabric 1.0 text-to-video API","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-23","last_updated":"2026-05-11"},{"id":"veed/fabric-1.0","name":"Fabric 1.0","created_by":"veed","source":"official","description":"VEED Fabric 1.0 is an image-to-video API that turns any image into a talking video","status":"active","release_date":"2025-09-19","model_type":"video","page_url":"https://fal.run/veed/fabric-1.0","tagline":"VEED Fabric 1.0 is an image-to-video API that turns any image into a talking video","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-23","last_updated":"2026-05-11"},{"id":"veed/lipsync","name":"Lipsync","created_by":"veed","source":"official","description":"Generate realistic lipsync from any audio using VEED's latest model","status":"active","release_date":"2025-05-28","model_type":"other","page_url":"https://fal.run/veed/lipsync","tagline":"Generate realistic lipsync from any audio using VEED's latest model","last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"veed/subtitles","name":"Subtitles","created_by":"veed","source":"official","description":"VEED’s Subtitles API transforms raw footage into polished, publish-ready content with professional burned-in subtitles starting at a base rate of $0.10 per minute.","status":"active","release_date":"2026-05-11","model_type":"other","page_url":"https://fal.run/veed/subtitles","tagline":"VEED’s Subtitles API transforms raw footage into polished, publish-ready content with professional burned-in subtitles starting at a base rate of $0.10 per 
minute.","last_seen_at":"2026-06-11","last_updated":"2026-06-18"},{"id":"veed/video-background-removal/fast","name":"Video Background Removal","created_by":"veed","source":"official","description":"Remove background from any video with people and objects.","status":"active","release_date":"2025-12-01","model_type":"other","page_url":"https://fal.run/veed/video-background-removal/fast","tagline":"Remove background from any video with people and objects.","last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"veed/video-background-removal/green-screen","name":"Video Background Removal","created_by":"veed","source":"official","description":"Remove background from videos filmed using chromakey, with automatic green spill suppression for clean, professional edges.","status":"active","release_date":"2025-11-28","model_type":"other","page_url":"https://fal.run/veed/video-background-removal/green-screen","tagline":"Remove background from videos filmed using chromakey, with automatic green spill suppression for clean, professional edges.","last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"veed/video-background-removal","name":"Video Background Removal","created_by":"veed","source":"official","description":"Remove background from any video with people and objects.","status":"active","release_date":"2025-11-28","model_type":"other","page_url":"https://fal.run/veed/video-background-removal","tagline":"Remove background from any video with people and objects.","last_seen_at":"2026-01-26","last_updated":"2026-05-11"},{"id":"wan/v2.6/image-to-image","name":"Wan v2.6 Image to Image","created_by":"wan","source":"official","description":"Wan 2.6 image-to-image model.","status":"active","release_date":"2025-12-23","model_type":"image","page_url":"https://fal.run/wan/v2.6/image-to-image","tagline":"Wan 2.6 image-to-image 
model.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"wan/v2.6/image-to-video/flash","name":"V2.6","created_by":"wan","source":"official","description":"Wan 2.6 image-to-video flash model.","status":"active","release_date":"2026-01-18","model_type":"video","page_url":"https://fal.run/wan/v2.6/image-to-video/flash","tagline":"Wan 2.6 image-to-video flash model.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"wan/v2.6/image-to-video","name":"Wan v2.6 Image to Video","created_by":"wan","source":"official","description":"Wan 2.6 image-to-video model.","status":"active","release_date":"2025-12-15","model_type":"video","page_url":"https://fal.run/wan/v2.6/image-to-video","tagline":"Wan 2.6 image-to-video model.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"wan/v2.6/reference-to-video/flash","name":"V2.6","created_by":"wan","source":"official","description":"Wan 2.6 reference-to-video flash model.","status":"active","release_date":"2026-02-06","model_type":"other","page_url":"https://fal.run/wan/v2.6/reference-to-video/flash","tagline":"Wan 2.6 reference-to-video flash model.","last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"wan/v2.6/reference-to-video","name":"Wan v2.6 Reference to Video","created_by":"wan","source":"official","description":"Wan 2.6 reference-to-video model.","status":"active","release_date":"2025-12-16","model_type":"other","page_url":"https://fal.run/wan/v2.6/reference-to-video","tagline":"Wan 2.6 reference-to-video model.","last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"wan/v2.6/text-to-image","name":"Wan v2.6 Text to 
Image","created_by":"wan","source":"official","description":"Wan 2.6 text-to-image model.","status":"active","release_date":"2025-12-23","model_type":"image","page_url":"https://fal.run/wan/v2.6/text-to-image","tagline":"Wan 2.6 text-to-image model.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-20","last_updated":"2026-05-11"},{"id":"wan/v2.6/text-to-video","name":"Wan v2.6 Text to Video","created_by":"wan","source":"official","description":"Wan 2.6 text-to-video model.","status":"active","release_date":"2025-12-16","model_type":"video","page_url":"https://fal.run/wan/v2.6/text-to-video","tagline":"Wan 2.6 text-to-video model.","modalities":{"input":["text"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"xai/grok-imagine-image/edit","name":"Grok Imagine Image","created_by":"xai","source":"official","family":"grok-imagine","description":"Edit images precisely with xAI's Grok Imagine model","status":"active","release_date":"2026-01-29","model_type":"image","page_url":"https://fal.run/xai/grok-imagine-image/edit","tagline":"Edit images precisely with xAI's Grok Imagine model","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"xai/grok-imagine-image/quality/edit","name":"Grok Imagine Image Editing Quality","created_by":"xai","source":"official","family":"grok-imagine","description":"Grok Imagine Pro is an advanced AI model from xAI that creates high-quality visuals from text prompts and allows you to edit or analyze existing images.","status":"active","release_date":"2026-04-09","model_type":"image","page_url":"https://fal.run/xai/grok-imagine-image/quality/edit","tagline":"Grok Imagine Pro is an advanced AI model from xAI that creates high-quality visuals from text prompts and allows you to edit or 
analyze existing images.","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-05-07","last_updated":"2026-05-11"},{"id":"xai/grok-imagine-image/quality/text-to-image","name":"Grok Imagine Image","created_by":"xai","source":"official","family":"grok-imagine","description":"Grok Imagine Pro is an advanced AI model from xAI that creates high-quality visuals from text prompts and allows you to edit or analyze existing images.","status":"active","release_date":"2026-04-09","model_type":"image","page_url":"https://fal.run/xai/grok-imagine-image/quality/text-to-image","tagline":"Grok Imagine Pro is an advanced AI model from xAI that creates high-quality visuals from text prompts and allows you to edit or analyze existing images.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-05-07","last_updated":"2026-05-11"},{"id":"xai/grok-imagine-image","name":"Grok Imagine Image","created_by":"xai","source":"official","family":"grok-imagine","description":"Generate highly aesthetic images with xAI's Grok Imagine Image generation model.","status":"active","release_date":"2026-01-29","model_type":"image","page_url":"https://fal.run/xai/grok-imagine-image","tagline":"Generate highly aesthetic images with xAI's Grok Imagine Image generation model.","capabilities":{"vision":true,"streaming":true,"tool_call":true,"batch":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11","license":"proprietary","open_weight":false},{"id":"xai/grok-imagine-video/edit-video","name":"Grok Imagine Video","created_by":"xai","source":"official","family":"grok-imagine","description":"Edit videos using xAI's Grok Imagine","status":"active","release_date":"2026-01-29","model_type":"other","page_url":"https://fal.run/xai/grok-imagine-video/edit-video","tagline":"Edit videos 
using xAI's Grok Imagine","last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"xai/grok-imagine-video/extend-video","name":"Grok Imagine Extend Video","created_by":"xai","source":"official","family":"grok-imagine","description":"Extend videos with xAI's Grok Imagine video model","status":"active","release_date":"2026-03-24","model_type":"other","page_url":"https://fal.run/xai/grok-imagine-video/extend-video","tagline":"Extend videos with xAI's Grok Imagine video model","last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"xai/grok-imagine-video/image-to-video","name":"Grok Imagine Video","created_by":"xai","source":"official","family":"grok-imagine","description":"Generate videos from images with audio using xAI's Grok Imagine Video model.","status":"active","release_date":"2026-01-29","model_type":"video","page_url":"https://fal.run/xai/grok-imagine-video/image-to-video","tagline":"Generate videos from images with audio using xAI's Grok Imagine Video model.","capabilities":{"vision":true},"modalities":{"input":["text","image","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"xai/grok-imagine-video/reference-to-video","name":"Grok Imagine Reference to Video","created_by":"xai","source":"official","family":"grok-imagine","description":"Generate videos using multiple reference images with xAI's Grok Imagine video model","status":"active","release_date":"2026-03-24","model_type":"video","page_url":"https://fal.run/xai/grok-imagine-video/reference-to-video","tagline":"Generate videos using multiple reference images with xAI's Grok Imagine video model","capabilities":{"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"xai/grok-imagine-video/text-to-video","name":"Grok Imagine Video","created_by":"xai","source":"official","family":"grok-imagine","description":"Generate videos 
with audio from text using Grok Imagine Video.","status":"active","release_date":"2026-01-29","model_type":"video","page_url":"https://fal.run/xai/grok-imagine-video/text-to-video","tagline":"Generate videos with audio from text using Grok Imagine Video.","modalities":{"input":["text","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-04-26","last_updated":"2026-05-11"},{"id":"xai/grok-imagine-video/v1.5/image-to-video","name":"Grok Imagine Video 1.5","created_by":"xai","source":"official","family":"grok-imagine","description":"Generate videos from images with audio using xAI's Grok Imagine 1.5 Video model.","status":"active","release_date":"2026-05-31","model_type":"video","page_url":"https://fal.run/xai/grok-imagine-video/v1.5/image-to-video","tagline":"Generate videos from images with audio using xAI's Grok Imagine 1.5 Video model.","capabilities":{"vision":true},"modalities":{"input":["text","image","audio"],"output":["video"]},"endpoints":["video"],"last_seen_at":"2026-06-02","last_updated":"2026-06-03"},{"id":"xai/tts/v1","name":"xAI Text to Speech","created_by":"xai","source":"official","family":"tts","description":"Generate speech with expressive and realistic voices from xAI","status":"active","release_date":"2026-03-17","model_type":"tts","page_url":"https://fal.run/xai/tts/v1","tagline":"Generate speech with expressive and realistic voices from xAI","capabilities":{"streaming":true},"modalities":{"input":["text"],"output":["audio"]},"endpoints":["audio_speech"],"last_seen_at":"2026-06-02","last_updated":"2026-06-03"}]}; export const models: Model[] = provider.models.map((m) => ({ ...m, provider: provider.id })); diff --git a/packages/npm/src/providers/google.ts b/packages/npm/src/providers/google.ts index 10354c6ac..32e696a06 100644 --- a/packages/npm/src/providers/google.ts +++ b/packages/npm/src/providers/google.ts @@ -3,6 +3,6 @@ import type { ProviderWithModels, Model } from '../types'; -export const provider: ProviderWithModels 
= {"id":"google","name":"Google AI","region":"US","headquarters":"Mountain View, CA","founded":2010,"url":"https://ai.google.dev","api_url":"https://generativelanguage.googleapis.com/v1beta","docs_url":"https://ai.google.dev/docs","pricing_url":"https://ai.google.dev/pricing","description":"Google AI Studio provides access to Gemini models for developers building with the Gemini API.","type":"direct","playground_url":"https://aistudio.google.com","status_url":"https://status.cloud.google.com","sdk":{"python":"google-genai","javascript":"@google/genai"},"openai_compatible":true,"free_tier":true,"github_url":"https://github.com/google-gemini","models_url":"https://ai.google.dev/gemini-api/docs/models","twitter_url":"https://x.com/GoogleDeepMind","blog_url":"https://deepmind.google/blog","terms_url":"https://ai.google.dev/gemini-api/terms","support_url":"https://ai.google.dev/gemini-api/docs/troubleshoot-ai-studio","icon":"\n \n \n \n \n","models":[{"id":"antigravity-preview-05-2026","name":"antigravity-preview-05-2026","created_by":"google","source":"official","status":"active","context_window":1048576,"max_output_tokens":65536,"license":"proprietary","page_url":"https://ai.google.dev/gemini-api/docs/models/antigravity-preview-05-2026","capabilities":{"streaming":true,"vision":true},"modalities":{"input":["text","image"],"output":["text"]},"open_weight":false,"endpoints":["generateContent","streamGenerateContent"],"last_updated":"2026-05-23"},{"id":"deep-research-max-preview-04-2026","name":"deep-research-max-preview-04-2026","created_by":"google","source":"official","family":"deep-research","status":"active","context_window":1048576,"max_output_tokens":65536,"license":"proprietary","page_url":"https://ai.google.dev/gemini-api/docs/models/deep-research-max-preview-04-2026","model_type":"reasoning","capabilities":{"streaming":true,"vision":true},"modalities":{"input":["text","image","video","audio"],"output":["text"]},"open_weight":false,"endpoints":["generateContent",
"streamGenerateContent"],"last_updated":"2026-04-22"},{"id":"deep-research-preview-04-2026","name":"deep-research-preview-04-2026","created_by":"google","source":"official","family":"deep-research","status":"active","context_window":1048576,"max_output_tokens":65536,"license":"proprietary","page_url":"https://ai.google.dev/gemini-api/docs/models/deep-research-preview-04-2026","model_type":"reasoning","capabilities":{"streaming":true,"vision":true},"modalities":{"input":["text","image","video","audio"],"output":["text"]},"open_weight":false,"endpoints":["generateContent","streamGenerateContent"],"last_updated":"2026-04-22"},{"id":"deep-research-pro-preview-12-2025","name":"deep-research-pro-preview-12-2025","created_by":"google","source":"official","last_updated":"2026-04-22","status":"active","context_window":1048576,"max_output_tokens":65536,"model_type":"reasoning","capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text","image","video","audio"],"output":["text"]},"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"family":"deep-research","license":"proprietary","page_url":"https://ai.google.dev/gemini-api/docs/models/deep-research-pro-preview-12-2025","open_weight":false},{"id":"embedding-001","name":"embedding-001","created_by":"google","source":"official","last_updated":"2026-06-02","status":"deprecated","deprecation_date":"2025-10-30","successor":"gemini-embedding-2","model_type":"embed","modalities":{"input":["text"],"output":["text"]},"family":"embed","license":"proprietary","open_weight":false},{"id":"embedding-gecko-001","name":"embedding-gecko-001","created_by":"google","source":"official","last_updated":"2026-06-02","status":"deprecated","deprecation_date":"2025-10-30","successor":"gemini-embedding-2","model_type":"embed","modalities":{"input":["text"],"output":["text"]},"family":"embed","license":"proprietary","
open_weight":false},{"id":"gemini-2.0-flash-001","name":"gemini-2.0-flash-001","created_by":"google","source":"official","last_updated":"2026-06-02","family":"gemini-2.0","status":"deprecated","capabilities":{"streaming":true,"vision":true},"modalities":{"input":["text","image"],"output":["text"]},"model_type":"chat","license":"proprietary","open_weight":false,"deprecation_date":"2026-06-01","successor":"gemini-3.5-flash"},{"id":"gemini-2.0-flash-lite-001","name":"gemini-2.0-flash-lite-001","created_by":"google","source":"official","last_updated":"2026-06-02","family":"gemini-2.0","status":"deprecated","capabilities":{"streaming":true,"vision":true},"modalities":{"input":["text","image"],"output":["text"]},"model_type":"chat","license":"proprietary","open_weight":false,"deprecation_date":"2026-06-01","successor":"gemini-3.1-flash-lite"},{"id":"gemini-2.0-flash-lite-preview-02-05","name":"gemini-2.0-flash-lite-preview-02-05","created_by":"google","source":"official","last_updated":"2026-03-23","family":"gemini-2.0","status":"deprecated","deprecation_date":"2025-12-09","successor":"gemini-2.5-flash-lite","capabilities":{"streaming":true,"vision":true},"modalities":{"input":["text","image"],"output":["text"]},"model_type":"chat","license":"proprietary","open_weight":false},{"id":"gemini-2.0-flash-lite-preview","name":"gemini-2.0-flash-lite-preview","created_by":"google","source":"official","last_updated":"2026-03-23","family":"gemini-2.0","status":"deprecated","deprecation_date":"2025-12-09","successor":"gemini-2.5-flash-lite","capabilities":{"streaming":true,"vision":true},"modalities":{"input":["text","image"],"output":["text"]},"model_type":"chat","license":"proprietary","open_weight":false},{"id":"gemini-2.0-flash-lite","name":"gemini-2.0-flash-lite","created_by":"google","source":"official","last_updated":"2026-06-02","family":"gemini-2.0","status":"deprecated","knowledge_cutoff":"2024-08","context_window":1048576,"max_output_tokens":8192,"capabilities":{"streamin
g":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text","image","video","audio"],"output":["text","image","audio"]},"pricing":{"input":0.075,"output":0.3,"batch_input":0.0375,"batch_output":0.15,"tiers":[{"label":"Text tokens","unit":"Per 1M tokens","columns":["Input","Cached input","Output"],"rows":[{"label":"Standard","values":[0.075,null,0.3]},{"label":"Batch","values":[0.0375,null,0.15]}]}]},"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"model_type":"chat","license":"proprietary","page_url":"https://ai.google.dev/gemini-api/docs/models/gemini-2.0-flash-lite","open_weight":false,"deprecation_date":"2026-06-01","successor":"gemini-3.1-flash-lite"},{"id":"gemini-2.0-flash-live-001","name":"gemini-2.0-flash-live-001","created_by":"google","source":"official","last_updated":"2026-03-27","family":"gemini-2.0","status":"deprecated","deprecation_date":"2025-12-09","successor":"gemini-3.1-flash-live-preview","capabilities":{"streaming":true,"vision":true},"modalities":{"input":["text","image"],"output":["text"]},"model_type":"chat","license":"proprietary","open_weight":false},{"id":"gemini-2.0-flash-preview-image-generation","name":"gemini-2.0-flash-preview-image-generation","created_by":"google","source":"official","last_updated":"2026-03-23","family":"gemini-2.0","status":"deprecated","deprecation_date":"2025-11-14","successor":"gemini-2.5-flash-image","capabilities":{"streaming":true,"vision":true},"modalities":{"input":["text","image"],"output":["text"]},"model_type":"chat","license":"proprietary","open_weight":false},{"id":"gemini-2.0-flash","name":"gemini-2.0-flash","created_by":"google","source":"official","last_updated":"2026-06-02","family":"gemini-2.0","status":"deprecated","knowledge_cutoff":"2024-08","context_window":1048576,"max_output_tokens":8192,"capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":t
rue,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text","image","video","audio"],"output":["text","image","audio"]},"pricing":{"input":0.1,"output":0.4,"cached_input":0.025,"batch_input":0.05,"batch_output":0.2,"tiers":[{"label":"Text tokens","unit":"Per 1M tokens","columns":["Input","Cached input","Output"],"rows":[{"label":"Standard","values":[0.1,0.025,0.4]},{"label":"Batch","values":[0.05,null,0.2]}]}]},"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"model_type":"chat","license":"proprietary","page_url":"https://ai.google.dev/gemini-api/docs/models/gemini-2.0-flash","open_weight":false,"deprecation_date":"2026-06-01","successor":"gemini-3.5-flash"},{"id":"gemini-2.5-computer-use-preview-10-2025","name":"gemini-2.5-computer-use-preview-10-2025","created_by":"google","source":"official","last_updated":"2026-04-22","family":"gemini-2.5","status":"active","context_window":128000,"max_output_tokens":64000,"capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":1.25,"output":10,"tiers":[{"label":"Text tokens","unit":"Per 1M tokens","columns":["Input","Cached 
input","Output"],"rows":[{"label":"Standard","values":[1.25,null,10]},{"label":"Batch","values":[null,null,null]}]}]},"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"model_type":"chat","license":"proprietary","page_url":"https://ai.google.dev/gemini-api/docs/models/gemini-2.5-computer-use-preview-10-2025","open_weight":false},{"id":"gemini-2.5-flash-image-preview","name":"gemini-2.5-flash-image-preview","created_by":"google","source":"official","last_updated":"2026-03-23","family":"gemini-2.5","status":"deprecated","deprecation_date":"2026-01-15","successor":"gemini-2.5-flash-image","capabilities":{"streaming":true,"vision":true},"modalities":{"input":["text","image"],"output":["text"]},"model_type":"chat","license":"proprietary","open_weight":false},{"id":"gemini-2.5-flash-image","name":"gemini-2.5-flash-image","created_by":"google","source":"official","last_updated":"2026-06-29","family":"gemini-2.5","status":"active","knowledge_cutoff":"2025-06","context_window":65536,"max_output_tokens":32768,"capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text","image","audio"],"output":["text","image","audio"]},"pricing":{"input":0.3,"output":0.039,"batch_input":0.15,"batch_output":0.0195,"tiers":[{"label":"Text tokens","unit":"Per 1M tokens","columns":["Input","Cached input","Output"],"rows":[{"label":"Standard","values":[0.3,null,0.039]},{"label":"Batch","values":[0.15,null,0.0195]}]}]},"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"model_type":"chat","license":"proprietary","page_url":"https://ai.google.dev/gemini-api/docs/models/gemini-2.5-flash-image","open_weight":false,"description":"The Interactions API is now generally available. We recommend using this API for access to all the latest features and models. 
Home Gemini API Docs Send feedback Gemini 2.5 Flash Image (Nano Banana) Our best engine for high-velocity visual creation, offering state-of-the-art speed and efficiency. Gemini 2.5 Flash Image, also known as Nano Banana, is best for high-volume generation, conversational image editing, and low-latency creative workflows that require native multimodal understanding.","tagline":"Our best engine for high-velocity visual creation, offering state-of-the-art speed and efficiency."},{"id":"gemini-2.5-flash-lite-preview-09-2025","name":"gemini-2.5-flash-lite-preview-09-2025","created_by":"google","source":"official","last_updated":"2026-05-10","family":"gemini-2.5","status":"deprecated","knowledge_cutoff":"2025-01","context_window":1048576,"max_output_tokens":65536,"capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text","image","video","audio"],"output":["text","image","audio"]},"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"model_type":"chat","license":"proprietary","page_url":"https://ai.google.dev/gemini-api/docs/models/gemini-2.5-flash-lite-preview-09-2025","open_weight":false,"deprecation_date":"2026-03-31","successor":"gemini-3.1-flash-lite"},{"id":"gemini-2.5-flash-lite","name":"gemini-2.5-flash-lite","created_by":"google","source":"official","last_updated":"2026-06-29","family":"gemini-2.5","status":"active","knowledge_cutoff":"2025-01","context_window":1048576,"max_output_tokens":65536,"capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text","image","video","audio"],"output":["text","image","audio"]},"pricing":{"input":0.1,"output":0.4,"cached_input":0.01,"batch_input":0.05,"batch_output":0.2,"tiers":[{"label":"Text tokens","unit":"Per 1M tokens","columns":["Input","Cached 
input","Output"],"rows":[{"label":"Standard","values":[0.1,0.01,0.4]},{"label":"Batch","values":[0.05,null,0.2]}]}]},"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"model_type":"chat","license":"proprietary","page_url":"https://ai.google.dev/gemini-api/docs/models/gemini-2.5-flash-lite","open_weight":false,"description":"The Interactions API is now generally available. We recommend using this API for access to all the latest features and models. Home Gemini API Docs Send feedback Gemini 2.5 Flash-Lite Our most cost-efficient multimodal model, offering the fastest performance for high-frequency, lightweight tasks. Gemini 2.5 Flash-Lite is best for high-volume classification, simple data extraction, and extremely low-latency applications where budget and speed are the primary constraints.","tagline":"Our most cost-efficient multimodal model, offering the fastest performance for high-frequency, lightweight tasks."},{"id":"gemini-2.5-flash-native-audio-preview-12-2025","name":"gemini-2.5-flash-native-audio-preview-12-2025","created_by":"google","source":"official","last_updated":"2026-06-29","family":"gemini-2.5","status":"active","knowledge_cutoff":"2025-01","context_window":131072,"max_output_tokens":8192,"capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text","image","video","audio"],"output":["text","image","audio"]},"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"model_type":"chat","license":"proprietary","page_url":"https://ai.google.dev/gemini-api/docs/models/gemini-2.5-flash-native-audio-preview-12-2025","open_weight":false,"description":"The Interactions API is now generally available. We recommend using this API for access to all the latest features and models. 
Home Gemini API Docs Send feedback Gemini 2.5 Flash Live Preview The Live API enables low-latency, real-time voice and video interactions with Gemini 2.5 Flash. It processes continuous streams of audio, video, or text to deliver immediate, human-like spoken responses, creating a natural conversational experience for your users.","tagline":"The Live API enables low-latency, real-time voice and video interactions with Gemini 2.5 Flash."},{"id":"gemini-2.5-flash-preview-05-20","name":"gemini-2.5-flash-preview-05-20","created_by":"google","source":"official","last_updated":"2026-05-23","family":"gemini-2.5","status":"deprecated","deprecation_date":"2025-11-18","successor":"gemini-3.5-flash","capabilities":{"streaming":true,"vision":true},"modalities":{"input":["text","image"],"output":["text"]},"model_type":"chat","license":"proprietary","open_weight":false},{"id":"gemini-2.5-flash-preview-09-2025","name":"gemini-2.5-flash-preview-09-2025","created_by":"google","source":"official","last_updated":"2026-03-24","family":"gemini-2.5","status":"active","knowledge_cutoff":"2025-01","context_window":1048576,"max_output_tokens":65536,"capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text","image","video","audio"],"output":["text","image","audio"]},"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"model_type":"chat","license":"proprietary","page_url":"https://ai.google.dev/gemini-api/docs/models/gemini-2.5-flash-preview-09-2025","open_weight":false},{"id":"gemini-2.5-flash-preview-09-25","name":"gemini-2.5-flash-preview-09-25","created_by":"google","source":"official","last_updated":"2026-05-23","family":"gemini-2.5","status":"deprecated","deprecation_date":"2026-02-17","successor":"gemini-3.5-flash","capabilities":{"streaming":true,"vision":true},"modalities":{"input":["text","image"],"output":["text"]},"model_type":"chat","license":
"proprietary","open_weight":false},{"id":"gemini-2.5-flash-preview-tts","name":"gemini-2.5-flash-preview-tts","created_by":"google","source":"official","last_updated":"2026-06-29","family":"gemini-2.5","status":"active","context_window":8192,"max_output_tokens":16384,"model_type":"tts","capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text","image","audio"],"output":["text","image","audio"]},"pricing":{"input":0.5,"output":10,"batch_input":0.25,"batch_output":5,"tiers":[{"label":"Text tokens","unit":"Per 1M tokens","columns":["Input","Cached input","Output"],"rows":[{"label":"Standard","values":[0.5,null,10]},{"label":"Batch","values":[0.25,null,5]}]}]},"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"license":"proprietary","page_url":"https://ai.google.dev/gemini-api/docs/models/gemini-2.5-flash-preview-tts","open_weight":false,"description":"The Interactions API is now generally available. We recommend using this API for access to all the latest features and models. Home Gemini API Docs Send feedback Gemini 2.5 Flash Text-to-Speech Our fastest engine for high-fidelity speech synthesis, offering low-latency and cost-efficient audio generation. 
Gemini 2.5 Flash TTS is best for real-time assistants, high-volume narration, and conversational use cases that require fine-grained control over voice style and pacing.","tagline":"Our fastest engine for high-fidelity speech synthesis, offering low-latency and cost-efficient audio generation."},{"id":"gemini-2.5-flash","name":"gemini-2.5-flash","created_by":"google","source":"official","last_updated":"2026-06-29","family":"gemini-2.5","status":"active","knowledge_cutoff":"2025-01","context_window":1048576,"max_output_tokens":65536,"capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text","image","video","audio"],"output":["text","image","audio"]},"pricing":{"input":0.3,"output":2.5,"cached_input":0.03,"batch_input":0.15,"batch_output":1.25,"tiers":[{"label":"Text tokens","unit":"Per 1M tokens","columns":["Input","Cached input","Output"],"rows":[{"label":"Standard","values":[0.3,0.03,2.5]},{"label":"Batch","values":[0.15,null,1.25]}]}]},"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"model_type":"chat","license":"proprietary","page_url":"https://ai.google.dev/gemini-api/docs/models/gemini-2.5-flash","open_weight":false,"description":"The Interactions API is now generally available. We recommend using this API for access to all the latest features and models. Home Gemini API Docs Send feedback Gemini 2.5 Flash Our best model in terms of price-performance, offering well-rounded capabilities. 
2.5 Flash is best for large scale processing, low-latency, high volume tasks that require thinking, and agentic use cases.","tagline":"Our best model in terms of price-performance, offering well-rounded capabilities."},{"id":"gemini-2.5-pro-preview-03-25","name":"gemini-2.5-pro-preview-03-25","created_by":"google","source":"official","last_updated":"2026-03-23","family":"gemini-2.5","status":"deprecated","deprecation_date":"2025-12-02","successor":"gemini-3.1-pro-preview","capabilities":{"streaming":true,"vision":true},"modalities":{"input":["text","image"],"output":["text"]},"model_type":"chat","license":"proprietary","open_weight":false},{"id":"gemini-2.5-pro-preview-05-06","name":"gemini-2.5-pro-preview-05-06","created_by":"google","source":"official","last_updated":"2026-03-23","family":"gemini-2.5","status":"deprecated","deprecation_date":"2025-12-02","successor":"gemini-3.1-pro-preview","capabilities":{"streaming":true,"vision":true},"modalities":{"input":["text","image"],"output":["text"]},"model_type":"chat","license":"proprietary","open_weight":false},{"id":"gemini-2.5-pro-preview-06-05","name":"gemini-2.5-pro-preview-06-05","created_by":"google","source":"official","last_updated":"2026-03-23","family":"gemini-2.5","status":"deprecated","deprecation_date":"2025-12-02","successor":"gemini-3.1-pro-preview","capabilities":{"streaming":true,"vision":true},"modalities":{"input":["text","image"],"output":["text"]},"model_type":"chat","license":"proprietary","open_weight":false},{"id":"gemini-2.5-pro-preview-tts","name":"gemini-2.5-pro-preview-tts","created_by":"google","source":"official","last_updated":"2026-06-29","family":"gemini-2.5","status":"active","context_window":8192,"max_output_tokens":16384,"model_type":"tts","capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text","image","audio"],"output":["text","image","audio"]},"pricing":{"input":1,"outpu
t":20,"batch_input":0.5,"batch_output":10,"tiers":[{"label":"Text tokens","unit":"Per 1M tokens","columns":["Input","Cached input","Output"],"rows":[{"label":"Standard","values":[1,null,20]},{"label":"Batch","values":[0.5,null,10]}]}]},"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"license":"proprietary","page_url":"https://ai.google.dev/gemini-api/docs/models/gemini-2.5-pro-preview-tts","open_weight":false,"description":"The Interactions API is now generally available. We recommend using this API for access to all the latest features and models. Home Gemini API Docs Send feedback Gemini 2.5 Pro Text-to-Speech Our premium engine for studio-quality speech synthesis, offering high-fidelity and sophisticated audio generation. Gemini 2.5 Pro TTS is best for long-form content, professional narrations, and complex creative workflows that require the highest level of vocal clarity and natural prosody.","tagline":"Our premium engine for studio-quality speech synthesis, offering high-fidelity and sophisticated audio generation."},{"id":"gemini-2.5-pro","name":"gemini-2.5-pro","created_by":"google","source":"official","last_updated":"2026-06-29","family":"gemini-2.5","status":"active","knowledge_cutoff":"2025-01","context_window":1048576,"max_output_tokens":65536,"capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text","image","video","audio"],"output":["text","image","audio"]},"pricing":{"input":1.25,"output":10,"cached_input":0.125,"batch_input":0.625,"batch_output":5,"tiers":[{"label":"Text tokens","unit":"Per 1M tokens","columns":["Input","Cached 
input","Output"],"rows":[{"label":"Standard","values":[1.25,0.125,10]},{"label":"Batch","values":[0.625,null,5]}]}]},"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"model_type":"chat","license":"proprietary","page_url":"https://ai.google.dev/gemini-api/docs/models/gemini-2.5-pro","open_weight":false,"description":"The Interactions API is now generally available. We recommend using this API for access to all the latest features and models. Home Gemini API Docs Send feedback Gemini 2.5 Pro Our state-of-the-art thinking model, capable of reasoning over complex problems in code, math, and STEM, as well as analyzing large datasets, codebases, and documents using long context.","tagline":"Our state-of-the-art thinking model, capable of reasoning over complex problems in code, math, and STEM, as well as analyzing large datasets, codebases, and documents using long context."},{"id":"gemini-3-flash-preview","name":"gemini-3-flash-preview","created_by":"google","source":"official","last_updated":"2026-06-29","family":"gemini-3","status":"active","knowledge_cutoff":"2025-01","context_window":1048576,"max_output_tokens":65536,"capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text","image","video","audio"],"output":["text","image","audio"]},"pricing":{"input":0.5,"output":3,"cached_input":0.05,"batch_input":0.25,"batch_output":1.5,"tiers":[{"label":"Text tokens","unit":"Per 1M tokens","columns":["Input","Cached input","Output"],"rows":[{"label":"Standard","values":[0.5,0.05,3]},{"label":"Batch","values":[0.25,null,1.5]}]}]},"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"model_type":"chat","license":"proprietary","page_url":"https://ai.google.dev/gemini-api/docs/models/gemini-3-flash-preview","open_weight":false,"description":"The Interactions API is now generally available. 
We recommend using this API for access to all the latest features and models. Home Gemini API Docs Send feedback Gemini 3 Flash Preview The best model in the world for multimodal understanding, and our most powerful agentic and vibe-coding model yet, delivering richer visuals and deeper interactivity, all built on a foundation of state-of-the-art reasoning.","tagline":"The best model in the world for multimodal understanding, and our most powerful agentic and vibe-coding model yet, delivering richer visuals and deeper interactivity, all built on a foundation of stat"},{"id":"gemini-3-pro-image-preview","name":"gemini-3-pro-image-preview","created_by":"google","source":"official","last_updated":"2026-06-29","family":"gemini-3","status":"deprecated","knowledge_cutoff":"2025-01","context_window":65536,"max_output_tokens":32768,"capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":2,"output":12,"batch_input":1,"batch_output":6,"tiers":[{"label":"Text tokens","unit":"Per 1M tokens","columns":["Input","Cached 
input","Output"],"rows":[{"label":"Standard","values":[2,null,12]},{"label":"Batch","values":[1,null,6]}]}]},"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"model_type":"chat","license":"proprietary","page_url":"https://ai.google.dev/gemini-api/docs/models/gemini-3-pro-image-preview","open_weight":false,"deprecation_date":"2026-06-25","successor":"gemini-3-pro-image"},{"id":"gemini-3-pro-image","name":"gemini-3-pro-image","created_by":"google","source":"official","family":"gemini-3","status":"active","knowledge_cutoff":"2025-01","context_window":65536,"max_output_tokens":32768,"license":"proprietary","page_url":"https://ai.google.dev/gemini-api/docs/models/gemini-3-pro-image","model_type":"chat","capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text","image","audio"],"output":["text","image","audio"]},"pricing":{"input":2,"output":12,"batch_input":1,"batch_output":6,"tiers":[{"label":"Text tokens","unit":"Per 1M tokens","columns":["Input","Cached input","Output"],"rows":[{"label":"Standard","values":[2,null,12]},{"label":"Batch","values":[1,null,6]}]}]},"open_weight":false,"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"last_updated":"2026-06-29","description":"The Interactions API is now generally available. We recommend using this API for access to all the latest features and models. Home Gemini API Docs Send feedback Gemini 3 Pro Image Nano Banana Pro is a sophisticated reasoning-driven engine for professional-grade image editing and generation, offering studio-quality precision and advanced creative control. 
Nano Banana Pro is best for complex graphic design, high-fidelity product mockups, and factual data visualizations that require accurate text rendering and real-world grounding via Google Search.","tagline":"The Interactions API is now generally available."},{"id":"gemini-3-pro-preview","name":"gemini-3-pro-preview","created_by":"google","source":"official","last_updated":"2026-03-24","family":"gemini-3","status":"deprecated","deprecation_date":"2026-03-09","knowledge_cutoff":"2025-01","context_window":1048576,"max_output_tokens":65536,"successor":"gemini-3.1-pro-preview","capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text","image","video","audio"],"output":["text","image","audio"]},"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"model_type":"chat","license":"proprietary","page_url":"https://ai.google.dev/gemini-api/docs/models/gemini-3-pro-preview","open_weight":false},{"id":"gemini-3.1-flash-image-preview","name":"gemini-3.1-flash-image-preview","created_by":"google","source":"official","last_updated":"2026-06-29","family":"gemini-3.1","status":"deprecated","knowledge_cutoff":"2025-01","context_window":131072,"max_output_tokens":32768,"capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":0.5,"output":3,"batch_input":0.25,"batch_output":1.5,"tiers":[{"label":"Text tokens","unit":"Per 1M tokens","columns":["Input","Cached 
input","Output"],"rows":[{"label":"Standard","values":[0.5,null,3]},{"label":"Batch","values":[0.25,null,1.5]}]}]},"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"model_type":"chat","license":"proprietary","page_url":"https://ai.google.dev/gemini-api/docs/models/gemini-3.1-flash-image-preview","open_weight":false,"deprecation_date":"2026-06-25","successor":"gemini-3.1-flash-image"},{"id":"gemini-3.1-flash-image","name":"gemini-3.1-flash-image","created_by":"google","source":"official","family":"gemini-3.1","status":"active","knowledge_cutoff":"2025-01","context_window":131072,"max_output_tokens":32768,"license":"proprietary","page_url":"https://ai.google.dev/gemini-api/docs/models/gemini-3.1-flash-image","model_type":"chat","capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text","image","audio"],"output":["text","image","audio"]},"pricing":{"input":0.5,"output":3,"batch_input":0.25,"batch_output":1.5,"tiers":[{"label":"Text tokens","unit":"Per 1M tokens","columns":["Input","Cached input","Output"],"rows":[{"label":"Standard","values":[0.5,null,3]},{"label":"Batch","values":[0.25,null,1.5]}]}]},"open_weight":false,"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"last_updated":"2026-06-29","description":"The Interactions API is now generally available. We recommend using this API for access to all the latest features and models. Home Gemini API Docs Send feedback Gemini 3.1 Flash Image Nano Banana 2 provides high-quality image generation and conversational editing at a mainstream price point and low latency. It serves as the high-efficiency counterpart to Gemini 3 Pro Image , optimized for speed and high-volume developer use cases. 
Key updates: New output resolution options: New support for 0.5K, 2K and 4K, default 1K New Image Search Grounding: Integration of both text and image search results to inform generation with real-time web data Supported with Thinking on or off New 1:4, 4:1, 1:8 and 8:1 aspect ratios Improved aspect ratio adherence Improved image quality and consistency Improved i18n text rendering","tagline":"The Interactions API is now generally available."},{"id":"gemini-3.1-flash-lite-preview","name":"gemini-3.1-flash-lite-preview","created_by":"google","source":"official","last_updated":"2026-05-29","family":"gemini-3.1","status":"deprecated","knowledge_cutoff":"2025-01","context_window":1048576,"max_output_tokens":65536,"capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text","image","video","audio"],"output":["text","image","audio"]},"pricing":{"input":0.25,"output":1.5,"cached_input":0.025,"batch_input":0.125,"batch_output":0.75,"tiers":[{"label":"Text tokens","unit":"Per 1M tokens","columns":["Input","Cached input","Output"],"rows":[{"label":"Standard","values":[0.25,0.025,1.5]},{"label":"Batch","values":[0.125,null,0.75]}]}]},"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"model_type":"chat","license":"proprietary","page_url":"https://ai.google.dev/gemini-api/docs/models/gemini-3.1-flash-lite-preview","open_weight":false,"description":"Our most cost-efficient multimodal model, offering the fastest performance for high-frequency, lightweight tasks. 
Gemini 3.1 Flash-Lite is best for high-volume agentic tasks, simple data extraction, and extremely low-latency applications where budget and speed are the primary constraints.","tagline":"Our most cost-efficient multimodal model, offering the fastest performance for high-frequency, lightweight tasks.","deprecation_date":"2026-05-25","successor":"gemini-3.1-flash-lite"},{"id":"gemini-3.1-flash-lite","name":"gemini-3.1-flash-lite","created_by":"google","source":"official","family":"gemini-3.1","description":"The Interactions API is now generally available. We recommend using this API for access to all the latest features and models. Home Gemini API Docs Send feedback Gemini 3.1 Flash-Lite Gemini 3.1 Flash-Lite is a low-latency, cost-effective multimodal model optimized for high-frequency, lightweight tasks. The model supports text, image, video, audio, and PDF inputs, and is designed for high-volume agentic workflows, simple data extraction, and applications where latency and API cost are the primary constraints.","status":"active","knowledge_cutoff":"2025-01","context_window":1048576,"max_output_tokens":65536,"license":"proprietary","page_url":"https://ai.google.dev/gemini-api/docs/models/gemini-3.1-flash-lite","model_type":"chat","tagline":"The model supports text, image, video, audio, and PDF inputs, and is designed for high-volume agentic workflows, simple data extraction, and applications where latency and API cost are the primary con","capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text","image","video","audio"],"output":["text","image","audio"]},"pricing":{"input":0.25,"output":1.5,"cached_input":0.025,"batch_input":0.125,"batch_output":0.75,"tiers":[{"label":"Text tokens","unit":"Per 1M tokens","columns":["Input","Cached 
input","Output"],"rows":[{"label":"Standard","values":[0.25,0.025,1.5]},{"label":"Batch","values":[0.125,null,0.75]}]}]},"open_weight":false,"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"last_updated":"2026-06-29"},{"id":"gemini-3.1-flash-live-preview","name":"gemini-3.1-flash-live-preview","created_by":"google","source":"official","family":"gemini-3.1","status":"active","knowledge_cutoff":"2025-01","context_window":131072,"max_output_tokens":65536,"license":"proprietary","page_url":"https://ai.google.dev/gemini-api/docs/models/gemini-3.1-flash-live-preview","model_type":"chat","capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text","image","video","audio"],"output":["text","image","audio"]},"pricing":{"input":0.75,"output":4.5,"tiers":[{"label":"Text tokens","unit":"Per 1M tokens","columns":["Input","Cached input","Output"],"rows":[{"label":"Standard","values":[0.75,null,4.5]}]}]},"open_weight":false,"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"last_updated":"2026-06-29","description":"The Interactions API is now generally available. We recommend using this API for access to all the latest features and models. Home Gemini API Docs Send feedback Gemini 3.1 Flash Live Preview Gemini 3.1 Flash Live Preview is our low-latency, audio-to-audio model optimized for real-time dialogue and voice-first AI applications with acoustic nuance detection, numeric precision, and multimodal awareness.","tagline":"The Interactions API is now generally available."},{"id":"gemini-3.1-flash-tts-preview","name":"gemini-3.1-flash-tts-preview","created_by":"google","source":"official","family":"gemini-3.1","description":"The Interactions API is now generally available. We recommend using this API for access to all the latest features and models. 
Home Gemini API Docs Send feedback Gemini 3.1 Flash TTS (Text-to-Speech) Preview The Gemini 3.1 Flash TTS Preview model provides powerful, low-latency speech generation with natural outputs, steerable prompts, and new expressive audio tags for precise narration control.","status":"active","knowledge_cutoff":"2025-01","context_window":8192,"max_output_tokens":16384,"license":"proprietary","page_url":"https://ai.google.dev/gemini-api/docs/models/gemini-3.1-flash-tts-preview","model_type":"tts","tagline":"The Gemini 3.1 Flash TTS Preview model provides powerful, low-latency speech generation with natural outputs, steerable prompts, and new expressive audio tags for precise narration control.","capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text","image","audio"],"output":["text","image","audio"]},"pricing":{"input":1,"output":20,"batch_input":0.5,"batch_output":10,"tiers":[{"label":"Text tokens","unit":"Per 1M tokens","columns":["Input","Cached input","Output"],"rows":[{"label":"Standard","values":[1,null,20]},{"label":"Batch","values":[0.5,null,10]}]}]},"open_weight":false,"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"last_updated":"2026-06-29"},{"id":"gemini-3.1-pro-preview","name":"gemini-3.1-pro-preview","created_by":"google","source":"official","last_updated":"2026-06-29","family":"gemini-3.1","status":"active","knowledge_cutoff":"2025-01","context_window":1048576,"max_output_tokens":65536,"capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text","image","video","audio"],"output":["text","image","audio"]},"pricing":{"input":2,"output":12,"cached_input":0.2,"batch_input":1,"batch_output":6,"tiers":[{"label":"Text tokens","unit":"Per 1M tokens","columns":["Input","Cached 
input","Output"],"rows":[{"label":"Standard","values":[2,0.2,12]},{"label":"Batch","values":[1,null,6]}]}]},"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"model_type":"chat","license":"proprietary","page_url":"https://ai.google.dev/gemini-api/docs/models/gemini-3.1-pro-preview","open_weight":false,"description":"The Interactions API is now generally available. We recommend using this API for access to all the latest features and models. Home Gemini API Docs Send feedback Gemini 3.1 Pro Preview Built to refine the performance and reliability of the Gemini 3 Pro series, Gemini 3.1 Pro Preview provides better thinking, improved token efficiency, and a more grounded, factually consistent experience. It's optimized for software engineering behavior and usability, as well as agentic workflows requiring precise tool usage and reliable multi-step execution across real-world domains.","tagline":"The Interactions API is now generally available."},{"id":"gemini-3.5-flash","name":"gemini-3.5-flash","created_by":"google","source":"official","family":"gemini-3.5","status":"active","knowledge_cutoff":"2025-01","context_window":1048576,"max_output_tokens":65536,"license":"proprietary","page_url":"https://ai.google.dev/gemini-api/docs/models/gemini-3.5-flash","model_type":"chat","capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text","image","video","audio"],"output":["text","image","audio"]},"pricing":{"input":1.5,"output":9,"cached_input":0.15,"batch_input":0.75,"batch_output":4.5,"tiers":[{"label":"Text tokens","unit":"Per 1M tokens","columns":["Input","Cached input","Output"],"rows":[{"label":"Standard","values":[1.5,0.15,9]},{"label":"Batch","values":[0.75,null,4.5]}]}]},"open_weight":false,"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"last_updated":"2026-06-29","description":"The 
Interactions API is now generally available. We recommend using this API for access to all the latest features and models. Home Gemini API Docs Send feedback Gemini 3.5 Flash Gemini 3.5 Flash provides sustained frontier-level intelligence optimized for real-world tasks at a higher speed and lower cost. Designed for the agentic era, it excels at sub-agent deployment, multi-step workflows, and long-horizon tasks at scale. This model is particularly effective for rapid agentic loops involving complex coding cycles and iterations.","tagline":"The Interactions API is now generally available."},{"id":"gemini-3.5-live-translate-preview","name":"gemini-3.5-live-translate-preview","created_by":"google","source":"official","family":"gemini-3.5","status":"active","knowledge_cutoff":"2025-01","context_window":131072,"max_output_tokens":65536,"license":"proprietary","page_url":"https://ai.google.dev/gemini-api/docs/models/gemini-3.5-live-translate-preview","model_type":"translation","capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text","image","audio"],"output":["text","image","audio"]},"pricing":{"input":3.5,"output":21,"tiers":[{"label":"Text tokens","unit":"Per 1M tokens","columns":["Input","Cached input","Output"],"rows":[{"label":"Standard","values":[3.5,null,21]}]}]},"open_weight":false,"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"last_updated":"2026-06-29","description":"The Interactions API is now generally available. We recommend using this API for access to all the latest features and models. Home Gemini API Docs Send feedback Gemini 3.5 Live Translate Gemini 3.5 Live Translate is our low-latency, audio-to-audio model optimized for real-time translation of spoken conversations. 
It enables seamless, bidirectional translation with high accuracy and natural voice output.","tagline":"The Interactions API is now generally available."},{"id":"gemini-embedding-001","name":"gemini-embedding-001","created_by":"google","source":"official","last_updated":"2026-03-27","status":"active","context_window":2048,"model_type":"embed","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["generateContent","streamGenerateContent"],"family":"gemini-embedding","license":"proprietary","page_url":"https://ai.google.dev/gemini-api/docs/models/gemini-embedding-001","open_weight":false},{"id":"gemini-embedding-2-preview","name":"gemini-embedding-2-preview","created_by":"google","source":"official","last_updated":"2026-03-23","status":"active","context_window":8192,"model_type":"embed","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["generateContent","streamGenerateContent"],"family":"gemini-embedding","license":"proprietary","page_url":"https://ai.google.dev/gemini-api/docs/models/gemini-embedding-2-preview","open_weight":false},{"id":"gemini-embedding-2","name":"gemini-embedding-2","created_by":"google","source":"official","family":"gemini-embedding","status":"active","context_window":8192,"license":"proprietary","page_url":"https://ai.google.dev/gemini-api/docs/models/gemini-embedding-2","model_type":"embed","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.2,"tiers":[{"label":"Text tokens","unit":"Per 1M tokens","columns":["Input","Cached 
input","Output"],"rows":[{"label":"Standard","values":[0.2,null,null]},{"label":"Batch","values":[0.1,null,null]}]}],"batch_input":0.1},"open_weight":false,"endpoints":["generateContent","streamGenerateContent"],"last_updated":"2026-05-29"},{"id":"gemini-embedding-exp-03-07","name":"gemini-embedding-exp-03-07","created_by":"google","source":"official","last_updated":"2026-06-02","status":"deprecated","deprecation_date":"2025-10-30","successor":"gemini-embedding-2","model_type":"embed","modalities":{"input":["text"],"output":["text"]},"family":"gemini-embedding","license":"proprietary","open_weight":false},{"id":"gemini-embedding-exp","name":"gemini-embedding-exp","created_by":"google","source":"official","last_updated":"2026-06-02","status":"deprecated","deprecation_date":"2025-10-30","successor":"gemini-embedding-2","model_type":"embed","modalities":{"input":["text"],"output":["text"]},"family":"gemini-embedding","license":"proprietary","open_weight":false},{"id":"gemini-live-2.5-flash-preview","name":"gemini-live-2.5-flash-preview","created_by":"google","source":"official","last_updated":"2026-03-27","status":"deprecated","deprecation_date":"2025-12-09","successor":"gemini-3.1-flash-live-preview","capabilities":{"streaming":true,"vision":true},"modalities":{"input":["text","image"],"output":["text"]},"family":"gemini-2.5","model_type":"chat","license":"proprietary","open_weight":false},{"id":"gemini-robotics-er-1.5-preview","name":"gemini-robotics-er-1.5-preview","created_by":"google","source":"official","last_updated":"2026-06-29","status":"deprecated","knowledge_cutoff":"2025-01","context_window":1048576,"max_output_tokens":65536,"capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text","image","video","audio"],"output":["text","image","audio"]},"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"family":"gemini-1.5","mod
el_type":"chat","license":"proprietary","page_url":"https://ai.google.dev/gemini-api/docs/models/gemini-robotics-er-1.5-preview","open_weight":false,"deprecation_date":"2026-04-30","successor":"gemini-robotics-er-1.6-preview","description":"The Interactions API is now generally available. We recommend using this API for access to all the latest features and models. Home Gemini API Docs Send feedback Gemini Robotics-ER 1.5 Note: This version is planned for deprecation soon . See the models page for the latest model version. Gemini Robotics-ER 1.5 is a vision-language model (VLM) that brings Gemini's agentic capabilities to robotics. It's designed for advanced reasoning in the physical world, allowing robots to interpret complex visual data, perform spatial reasoning, and plan actions from natural language commands.","tagline":"The Interactions API is now generally available."},{"id":"gemini-robotics-er-1.6-preview","name":"gemini-robotics-er-1.6-preview","created_by":"google","source":"official","family":"gemini-1.6","status":"active","knowledge_cutoff":"2025-01","context_window":131072,"max_output_tokens":65536,"license":"proprietary","page_url":"https://ai.google.dev/gemini-api/docs/models/gemini-robotics-er-1.6-preview","model_type":"chat","capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text","image","video","audio"],"output":["text","image","audio"]},"open_weight":false,"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"last_updated":"2026-06-29","description":"The Interactions API is now generally available. We recommend using this API for access to all the latest features and models. Home Gemini API Docs Send feedback Gemini Robotics-ER 1.6 Gemini Robotics-ER 1.6 is a vision-language model (VLM) that brings Gemini's agentic capabilities to robotics. 
It's designed for advanced reasoning in the physical world, allowing robots to interpret complex visual data, perform spatial reasoning, and plan actions from natural language commands.","tagline":"The Interactions API is now generally available."},{"id":"imagen-3.0-generate-002","name":"imagen-3.0-generate-002","created_by":"google","source":"official","last_updated":"2026-03-23","status":"deprecated","deprecation_date":"2025-11-10","successor":"imagen-4.0-generate-001","model_type":"image","modalities":{"input":["text"],"output":["image"]},"family":"imagen-3.0","license":"proprietary","open_weight":false},{"id":"imagen-4.0-fast-generate-001","name":"imagen-4.0-fast-generate-001","created_by":"google","source":"official","last_updated":"2026-03-27","status":"active","model_type":"image","modalities":{"input":["text"],"output":["image"]},"family":"imagen-4.0","license":"proprietary","open_weight":false},{"id":"imagen-4.0-generate-001","name":"imagen-4.0-generate-001","created_by":"google","source":"official","last_updated":"2026-03-27","status":"active","model_type":"image","modalities":{"input":["text"],"output":["image"]},"family":"imagen-4.0","license":"proprietary","open_weight":false},{"id":"imagen-4.0-generate-preview-06-06","name":"imagen-4.0-generate-preview-06-06","created_by":"google","source":"official","last_updated":"2026-03-23","status":"deprecated","deprecation_date":"2026-02-17","successor":"imagen-4.0-generate-001","model_type":"image","modalities":{"input":["text"],"output":["image"]},"family":"imagen-4.0","license":"proprietary","open_weight":false},{"id":"imagen-4.0-ultra-generate-001","name":"imagen-4.0-ultra-generate-001","created_by":"google","source":"official","last_updated":"2026-03-27","status":"active","model_type":"image","modalities":{"input":["text"],"output":["image"]},"family":"imagen-4.0","license":"proprietary","open_weight":false},{"id":"imagen-4.0-ultra-generate-preview-06-06","name":"imagen-4.0-ultra-generate-preview-06-06","cre
ated_by":"google","source":"official","last_updated":"2026-03-23","status":"deprecated","deprecation_date":"2026-02-17","successor":"imagen-4.0-ultra-generate-001","model_type":"image","modalities":{"input":["text"],"output":["image"]},"family":"imagen-4.0","license":"proprietary","open_weight":false},{"id":"imagen","name":"imagen","created_by":"google","source":"official","last_updated":"2026-06-29","status":"active","context_window":480,"model_type":"image","capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text"],"output":["image"]},"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"family":"imagen","license":"proprietary","page_url":"https://ai.google.dev/gemini-api/docs/models/imagen","open_weight":false,"description":"The Interactions API is now generally available. We recommend using this API for access to all the latest features and models. Home Gemini API Docs Send feedback Imagen 4 The Imagen 4 standard, ultra, and fast endpoints are deprecated and will be shut down on **August 17, 2026**; migrate to Gemini 3.1 Flash Image to avoid service interruptions. A high-performance engine for advanced visual synthesis, offering sophisticated creative control and photorealistic output. 
Use Imagen 4 for professional branding, intricate scene composition, and high-fidelity design tasks that require precise text rendering and complex lighting.","tagline":"A high-performance engine for advanced visual synthesis, offering sophisticated creative control and photorealistic output."},{"id":"lyria-3-clip-preview","name":"lyria-3-clip-preview","created_by":"google","source":"official","status":"active","context_window":131072,"license":"proprietary","page_url":"https://ai.google.dev/gemini-api/docs/models/lyria-3-clip-preview","model_type":"tts","capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text"],"output":["audio"]},"open_weight":false,"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"last_updated":"2026-06-29","description":"The Interactions API is now generally available. We recommend using this API for access to all the latest features and models. Home Gemini API Docs Send feedback Lyria 3 Clip Preview Lyria 3 Clip Preview is Google's model optimized for generating short musical clips, loops, and previews. It generates 30-second high-quality, 48kHz stereo audio from text prompts or image inputs.","tagline":"The Interactions API is now generally available."},{"id":"lyria-3-pro-preview","name":"lyria-3-pro-preview","created_by":"google","source":"official","status":"active","context_window":131072,"license":"proprietary","page_url":"https://ai.google.dev/gemini-api/docs/models/lyria-3-pro-preview","model_type":"tts","capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text"],"output":["audio"]},"open_weight":false,"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"last_updated":"2026-06-29","description":"The Interactions API is now generally available. 
We recommend using this API for access to all the latest features and models. Home Gemini API Docs Send feedback Lyria 3 Pro Preview Lyria 3 Pro Preview is Google's flagship music generation model. It is optimized for generating full-length songs with complex structural coherence, including multiple verses, choruses, and bridges. It generates high-quality, 48kHz stereo audio from text prompts or image inputs.","tagline":"The Interactions API is now generally available."},{"id":"lyria-realtime-exp","name":"lyria-realtime-exp","created_by":"google","source":"official","last_updated":"2026-03-24","status":"active","model_type":"tts","capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text"],"output":["audio"]},"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"license":"proprietary","page_url":"https://ai.google.dev/gemini-api/docs/models/lyria-realtime-exp","open_weight":false},{"id":"text-embedding-004","name":"text-embedding-004","created_by":"google","source":"official","last_updated":"2026-06-02","status":"deprecated","deprecation_date":"2026-01-14","successor":"gemini-embedding-2","model_type":"embed","modalities":{"input":["text"],"output":["text"]},"family":"text-embedding","license":"proprietary","open_weight":false},{"id":"veo-2.0-generate-001","name":"veo-2.0-generate-001","created_by":"google","source":"official","last_updated":"2026-06-29","status":"active","model_type":"video","capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text","image"],"output":["video"]},"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"family":"veo-2.0","license":"proprietary","page_url":"https://ai.google.dev/gemini-api/docs/models/veo-2.0-generate-001","open_weight":false,"description":"The 
Interactions API is now generally available. We recommend using this API for access to all the latest features and models. Home Gemini API Docs Send feedback Veo 2.0 This model is deprecated and will be shut down on **June 30, 2026**; migrate to Veo 3.1 Preview or the GA models available through the Gemini Enterprise Agent Platform to avoid service interruptions. Our robust and reliable stable video generation model, providing consistent performance for production-ready workflows. Veo 2.0 is best for standard 1080p content creation, social media assets, and high-volume video tasks that prioritize reliable character consistency and predictable sub-second generation speeds.","tagline":"Our robust and reliable stable video generation model, providing consistent performance for production-ready workflows."},{"id":"veo-3.0-fast-generate-001","name":"veo-3.0-fast-generate-001","created_by":"google","source":"official","family":"veo-3.0","status":"active","license":"proprietary","model_type":"video","modalities":{"input":["text"],"output":["video"]},"open_weight":false,"last_updated":"2026-06-18"},{"id":"veo-3.0-fast-generate-preview","name":"veo-3.0-fast-generate-preview","created_by":"google","source":"official","last_updated":"2026-03-23","status":"deprecated","deprecation_date":"2025-11-12","successor":"veo-3.1-fast-generate-preview","model_type":"video","modalities":{"input":["text"],"output":["video"]},"family":"veo-3.0","license":"proprietary","open_weight":false},{"id":"veo-3.0-generate-001","name":"veo-3.0-generate-001","created_by":"google","source":"official","family":"veo-3.0","status":"active","license":"proprietary","model_type":"video","modalities":{"input":["text"],"output":["video"]},"open_weight":false,"last_updated":"2026-06-18"},{"id":"veo-3.0-generate-preview","name":"veo-3.0-generate-preview","created_by":"google","source":"official","last_updated":"2026-03-23","status":"deprecated","deprecation_date":"2025-11-12","successor":"veo-3.1-generate-preview
","model_type":"video","modalities":{"input":["text"],"output":["video"]},"family":"veo-3.0","license":"proprietary","open_weight":false},{"id":"veo-3.1-fast-generate-preview","name":"veo-3.1-fast-generate-preview","created_by":"google","source":"official","family":"veo-3.1","status":"deprecated","deprecation_date":"2025-10-15","license":"proprietary","model_type":"video","modalities":{"input":["text"],"output":["video"]},"open_weight":false,"last_updated":"2026-03-26"},{"id":"veo-3.1-generate-preview","name":"veo-3.1-generate-preview","created_by":"google","source":"official","last_updated":"2026-06-29","status":"active","context_window":1024,"model_type":"video","capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text","image"],"output":["video"]},"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"family":"veo-3.1","license":"proprietary","page_url":"https://ai.google.dev/gemini-api/docs/models/veo-3.1-generate-preview","open_weight":false,"description":"The Interactions API is now generally available. We recommend using this API for access to all the latest features and models. Home Gemini API Docs Send feedback Veo 3.1 A state-of-the-art cinematic engine designed for high-end creative storytelling and experimental video production. 
Veo 3.1 is best for professional-grade 4K output, natively synchronized audio generation, and complex camera movements that require the highest level of temporal consistency and artistic control.","tagline":"A state-of-the-art cinematic engine designed for high-end creative storytelling and experimental video production."},{"id":"veo-3.1-lite-generate-preview","name":"veo-3.1-lite-generate-preview","created_by":"google","source":"official","family":"veo-3.1","status":"active","context_window":1024,"license":"proprietary","page_url":"https://ai.google.dev/gemini-api/docs/models/veo-3.1-lite-generate-preview","model_type":"video","capabilities":{"streaming":true,"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"open_weight":false,"endpoints":["generateContent","streamGenerateContent"],"last_updated":"2026-06-29","description":"The Interactions API is now generally available. We recommend using this API for access to all the latest features and models. Home Gemini API Docs Send feedback Veo 3.1 Lite Preview Veo 3.1 Lite Preview is a high-efficiency, developer-first video model providing high-fidelity video generation, editing, and cinematic control. 
It leverages the state-of-the-art Veo 3.1 model to democratize professional-grade video AI by offering a scalable, programmable interface for creators and enterprises.","tagline":"The Interactions API is now generally available."}]}; +export const provider: ProviderWithModels = {"id":"google","name":"Google AI","region":"US","headquarters":"Mountain View, CA","founded":2010,"url":"https://ai.google.dev","api_url":"https://generativelanguage.googleapis.com/v1beta","docs_url":"https://ai.google.dev/docs","pricing_url":"https://ai.google.dev/pricing","description":"Google AI Studio provides access to Gemini models for developers building with the Gemini API.","type":"direct","playground_url":"https://aistudio.google.com","status_url":"https://status.cloud.google.com","sdk":{"python":"google-genai","javascript":"@google/genai"},"openai_compatible":true,"free_tier":true,"github_url":"https://github.com/google-gemini","models_url":"https://ai.google.dev/gemini-api/docs/models","twitter_url":"https://x.com/GoogleDeepMind","blog_url":"https://deepmind.google/blog","terms_url":"https://ai.google.dev/gemini-api/terms","support_url":"https://ai.google.dev/gemini-api/docs/troubleshoot-ai-studio","icon":"\n \n \n \n 
\n","models":[{"id":"antigravity-preview-05-2026","name":"antigravity-preview-05-2026","created_by":"google","source":"official","status":"active","context_window":1048576,"max_output_tokens":65536,"license":"proprietary","page_url":"https://ai.google.dev/gemini-api/docs/models/antigravity-preview-05-2026","capabilities":{"streaming":true,"vision":true},"modalities":{"input":["text","image"],"output":["text"]},"open_weight":false,"endpoints":["generateContent","streamGenerateContent"],"last_updated":"2026-05-23"},{"id":"deep-research-max-preview-04-2026","name":"deep-research-max-preview-04-2026","created_by":"google","source":"official","family":"deep-research","status":"active","context_window":1048576,"max_output_tokens":65536,"license":"proprietary","page_url":"https://ai.google.dev/gemini-api/docs/models/deep-research-max-preview-04-2026","model_type":"reasoning","capabilities":{"streaming":true,"vision":true},"modalities":{"input":["text","image","video","audio"],"output":["text"]},"open_weight":false,"endpoints":["generateContent","streamGenerateContent"],"last_updated":"2026-04-22"},{"id":"deep-research-preview-04-2026","name":"deep-research-preview-04-2026","created_by":"google","source":"official","family":"deep-research","status":"active","context_window":1048576,"max_output_tokens":65536,"license":"proprietary","page_url":"https://ai.google.dev/gemini-api/docs/models/deep-research-preview-04-2026","model_type":"reasoning","capabilities":{"streaming":true,"vision":true},"modalities":{"input":["text","image","video","audio"],"output":["text"]},"open_weight":false,"endpoints":["generateContent","streamGenerateContent"],"last_updated":"2026-04-22"},{"id":"deep-research-pro-preview-12-2025","name":"deep-research-pro-preview-12-2025","created_by":"google","source":"official","last_updated":"2026-04-22","status":"active","context_window":1048576,"max_output_tokens":65536,"model_type":"reasoning","capabilities":{"streaming":true,"tool_call":true,"structured_outp
ut":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text","image","video","audio"],"output":["text"]},"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"family":"deep-research","license":"proprietary","page_url":"https://ai.google.dev/gemini-api/docs/models/deep-research-pro-preview-12-2025","open_weight":false},{"id":"embedding-001","name":"embedding-001","created_by":"google","source":"official","last_updated":"2026-06-02","status":"deprecated","deprecation_date":"2025-10-30","successor":"gemini-embedding-2","model_type":"embed","modalities":{"input":["text"],"output":["text"]},"family":"embed","license":"proprietary","open_weight":false},{"id":"embedding-gecko-001","name":"embedding-gecko-001","created_by":"google","source":"official","last_updated":"2026-06-02","status":"deprecated","deprecation_date":"2025-10-30","successor":"gemini-embedding-2","model_type":"embed","modalities":{"input":["text"],"output":["text"]},"family":"embed","license":"proprietary","open_weight":false},{"id":"gemini-2.0-flash-001","name":"gemini-2.0-flash-001","created_by":"google","source":"official","last_updated":"2026-06-02","family":"gemini-2.0","status":"deprecated","capabilities":{"streaming":true,"vision":true},"modalities":{"input":["text","image"],"output":["text"]},"model_type":"chat","license":"proprietary","open_weight":false,"deprecation_date":"2026-06-01","successor":"gemini-3.5-flash"},{"id":"gemini-2.0-flash-lite-001","name":"gemini-2.0-flash-lite-001","created_by":"google","source":"official","last_updated":"2026-06-02","family":"gemini-2.0","status":"deprecated","capabilities":{"streaming":true,"vision":true},"modalities":{"input":["text","image"],"output":["text"]},"model_type":"chat","license":"proprietary","open_weight":false,"deprecation_date":"2026-06-01","successor":"gemini-3.1-flash-lite"},{"id":"gemini-2.0-flash-lite-preview-02-05","name":"gemini-2.0-flash-lite-preview-02-05","created
_by":"google","source":"official","last_updated":"2026-03-23","family":"gemini-2.0","status":"deprecated","deprecation_date":"2025-12-09","successor":"gemini-2.5-flash-lite","capabilities":{"streaming":true,"vision":true},"modalities":{"input":["text","image"],"output":["text"]},"model_type":"chat","license":"proprietary","open_weight":false},{"id":"gemini-2.0-flash-lite-preview","name":"gemini-2.0-flash-lite-preview","created_by":"google","source":"official","last_updated":"2026-03-23","family":"gemini-2.0","status":"deprecated","deprecation_date":"2025-12-09","successor":"gemini-2.5-flash-lite","capabilities":{"streaming":true,"vision":true},"modalities":{"input":["text","image"],"output":["text"]},"model_type":"chat","license":"proprietary","open_weight":false},{"id":"gemini-2.0-flash-lite","name":"gemini-2.0-flash-lite","created_by":"google","source":"official","last_updated":"2026-06-02","family":"gemini-2.0","status":"deprecated","knowledge_cutoff":"2024-08","context_window":1048576,"max_output_tokens":8192,"capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text","image","video","audio"],"output":["text","image","audio"]},"pricing":{"input":0.075,"output":0.3,"batch_input":0.0375,"batch_output":0.15,"tiers":[{"label":"Text tokens","unit":"Per 1M tokens","columns":["Input","Cached 
input","Output"],"rows":[{"label":"Standard","values":[0.075,null,0.3]},{"label":"Batch","values":[0.0375,null,0.15]}]}]},"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"model_type":"chat","license":"proprietary","page_url":"https://ai.google.dev/gemini-api/docs/models/gemini-2.0-flash-lite","open_weight":false,"deprecation_date":"2026-06-01","successor":"gemini-3.1-flash-lite"},{"id":"gemini-2.0-flash-live-001","name":"gemini-2.0-flash-live-001","created_by":"google","source":"official","last_updated":"2026-03-27","family":"gemini-2.0","status":"deprecated","deprecation_date":"2025-12-09","successor":"gemini-3.1-flash-live-preview","capabilities":{"streaming":true,"vision":true},"modalities":{"input":["text","image"],"output":["text"]},"model_type":"chat","license":"proprietary","open_weight":false},{"id":"gemini-2.0-flash-preview-image-generation","name":"gemini-2.0-flash-preview-image-generation","created_by":"google","source":"official","last_updated":"2026-03-23","family":"gemini-2.0","status":"deprecated","deprecation_date":"2025-11-14","successor":"gemini-2.5-flash-image","capabilities":{"streaming":true,"vision":true},"modalities":{"input":["text","image"],"output":["text"]},"model_type":"chat","license":"proprietary","open_weight":false},{"id":"gemini-2.0-flash","name":"gemini-2.0-flash","created_by":"google","source":"official","last_updated":"2026-06-02","family":"gemini-2.0","status":"deprecated","knowledge_cutoff":"2024-08","context_window":1048576,"max_output_tokens":8192,"capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text","image","video","audio"],"output":["text","image","audio"]},"pricing":{"input":0.1,"output":0.4,"cached_input":0.025,"batch_input":0.05,"batch_output":0.2,"tiers":[{"label":"Text tokens","unit":"Per 1M tokens","columns":["Input","Cached 
input","Output"],"rows":[{"label":"Standard","values":[0.1,0.025,0.4]},{"label":"Batch","values":[0.05,null,0.2]}]}]},"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"model_type":"chat","license":"proprietary","page_url":"https://ai.google.dev/gemini-api/docs/models/gemini-2.0-flash","open_weight":false,"deprecation_date":"2026-06-01","successor":"gemini-3.5-flash"},{"id":"gemini-2.5-computer-use-preview-10-2025","name":"gemini-2.5-computer-use-preview-10-2025","created_by":"google","source":"official","last_updated":"2026-04-22","family":"gemini-2.5","status":"active","context_window":128000,"max_output_tokens":64000,"capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":1.25,"output":10,"tiers":[{"label":"Text tokens","unit":"Per 1M tokens","columns":["Input","Cached input","Output"],"rows":[{"label":"Standard","values":[1.25,null,10]},{"label":"Batch","values":[null,null,null]}]}]},"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"model_type":"chat","license":"proprietary","page_url":"https://ai.google.dev/gemini-api/docs/models/gemini-2.5-computer-use-preview-10-2025","open_weight":false},{"id":"gemini-2.5-flash-image-preview","name":"gemini-2.5-flash-image-preview","created_by":"google","source":"official","last_updated":"2026-03-23","family":"gemini-2.5","status":"deprecated","deprecation_date":"2026-01-15","successor":"gemini-2.5-flash-image","capabilities":{"streaming":true,"vision":true},"modalities":{"input":["text","image"],"output":["text"]},"model_type":"chat","license":"proprietary","open_weight":false},{"id":"gemini-2.5-flash-image","name":"gemini-2.5-flash-image","created_by":"google","source":"official","last_updated":"2026-06-29","family":"gemini-2.5","status":"active","knowledge_cutoff":"2025-06","context_window":65536,
"max_output_tokens":32768,"capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text","image","audio"],"output":["text","image","audio"]},"pricing":{"input":0.3,"output":0.039,"batch_input":0.15,"batch_output":0.0195,"tiers":[{"label":"Text tokens","unit":"Per 1M tokens","columns":["Input","Cached input","Output"],"rows":[{"label":"Standard","values":[0.3,null,0.039]},{"label":"Batch","values":[0.15,null,0.0195]}]}]},"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"model_type":"chat","license":"proprietary","page_url":"https://ai.google.dev/gemini-api/docs/models/gemini-2.5-flash-image","open_weight":false,"description":"The Interactions API is now generally available. We recommend using this API for access to all the latest features and models. Home Gemini API Docs Send feedback Gemini 2.5 Flash Image (Nano Banana) Our best engine for high-velocity visual creation, offering state-of-the-art speed and efficiency. 
Gemini 2.5 Flash Image, also known as Nano Banana, is best for high-volume generation, conversational image editing, and low-latency creative workflows that require native multimodal understanding.","tagline":"Our best engine for high-velocity visual creation, offering state-of-the-art speed and efficiency."},{"id":"gemini-2.5-flash-lite-preview-09-2025","name":"gemini-2.5-flash-lite-preview-09-2025","created_by":"google","source":"official","last_updated":"2026-05-10","family":"gemini-2.5","status":"deprecated","knowledge_cutoff":"2025-01","context_window":1048576,"max_output_tokens":65536,"capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text","image","video","audio"],"output":["text","image","audio"]},"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"model_type":"chat","license":"proprietary","page_url":"https://ai.google.dev/gemini-api/docs/models/gemini-2.5-flash-lite-preview-09-2025","open_weight":false,"deprecation_date":"2026-03-31","successor":"gemini-3.1-flash-lite"},{"id":"gemini-2.5-flash-lite","name":"gemini-2.5-flash-lite","created_by":"google","source":"official","last_updated":"2026-06-29","family":"gemini-2.5","status":"active","knowledge_cutoff":"2025-01","context_window":1048576,"max_output_tokens":65536,"capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text","image","video","audio"],"output":["text","image","audio"]},"pricing":{"input":0.1,"output":0.4,"cached_input":0.01,"batch_input":0.05,"batch_output":0.2,"tiers":[{"label":"Text tokens","unit":"Per 1M tokens","columns":["Input","Cached 
input","Output"],"rows":[{"label":"Standard","values":[0.1,0.01,0.4]},{"label":"Batch","values":[0.05,null,0.2]}]}]},"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"model_type":"chat","license":"proprietary","page_url":"https://ai.google.dev/gemini-api/docs/models/gemini-2.5-flash-lite","open_weight":false,"description":"The Interactions API is now generally available. We recommend using this API for access to all the latest features and models. Home Gemini API Docs Send feedback Gemini 2.5 Flash-Lite Our most cost-efficient multimodal model, offering the fastest performance for high-frequency, lightweight tasks. Gemini 2.5 Flash-Lite is best for high-volume classification, simple data extraction, and extremely low-latency applications where budget and speed are the primary constraints.","tagline":"Our most cost-efficient multimodal model, offering the fastest performance for high-frequency, lightweight tasks."},{"id":"gemini-2.5-flash-native-audio-preview-12-2025","name":"gemini-2.5-flash-native-audio-preview-12-2025","created_by":"google","source":"official","last_updated":"2026-06-29","family":"gemini-2.5","status":"active","knowledge_cutoff":"2025-01","context_window":131072,"max_output_tokens":8192,"capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text","image","video","audio"],"output":["text","image","audio"]},"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"model_type":"chat","license":"proprietary","page_url":"https://ai.google.dev/gemini-api/docs/models/gemini-2.5-flash-native-audio-preview-12-2025","open_weight":false,"description":"The Interactions API is now generally available. We recommend using this API for access to all the latest features and models. 
Home Gemini API Docs Send feedback Gemini 2.5 Flash Live Preview The Live API enables low-latency, real-time voice and video interactions with Gemini 2.5 Flash. It processes continuous streams of audio, video, or text to deliver immediate, human-like spoken responses, creating a natural conversational experience for your users.","tagline":"The Live API enables low-latency, real-time voice and video interactions with Gemini 2.5 Flash."},{"id":"gemini-2.5-flash-preview-05-20","name":"gemini-2.5-flash-preview-05-20","created_by":"google","source":"official","last_updated":"2026-05-23","family":"gemini-2.5","status":"deprecated","deprecation_date":"2025-11-18","successor":"gemini-3.5-flash","capabilities":{"streaming":true,"vision":true},"modalities":{"input":["text","image"],"output":["text"]},"model_type":"chat","license":"proprietary","open_weight":false},{"id":"gemini-2.5-flash-preview-09-2025","name":"gemini-2.5-flash-preview-09-2025","created_by":"google","source":"official","last_updated":"2026-03-24","family":"gemini-2.5","status":"active","knowledge_cutoff":"2025-01","context_window":1048576,"max_output_tokens":65536,"capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text","image","video","audio"],"output":["text","image","audio"]},"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"model_type":"chat","license":"proprietary","page_url":"https://ai.google.dev/gemini-api/docs/models/gemini-2.5-flash-preview-09-2025","open_weight":false},{"id":"gemini-2.5-flash-preview-09-25","name":"gemini-2.5-flash-preview-09-25","created_by":"google","source":"official","last_updated":"2026-05-23","family":"gemini-2.5","status":"deprecated","deprecation_date":"2026-02-17","successor":"gemini-3.5-flash","capabilities":{"streaming":true,"vision":true},"modalities":{"input":["text","image"],"output":["text"]},"model_type":"chat","license":
"proprietary","open_weight":false},{"id":"gemini-2.5-flash-preview-tts","name":"gemini-2.5-flash-preview-tts","created_by":"google","source":"official","last_updated":"2026-06-29","family":"gemini-2.5","status":"active","context_window":8192,"max_output_tokens":16384,"model_type":"tts","capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text","image","audio"],"output":["text","image","audio"]},"pricing":{"input":0.5,"output":10,"batch_input":0.25,"batch_output":5,"tiers":[{"label":"Text tokens","unit":"Per 1M tokens","columns":["Input","Cached input","Output"],"rows":[{"label":"Standard","values":[0.5,null,10]},{"label":"Batch","values":[0.25,null,5]}]}]},"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"license":"proprietary","page_url":"https://ai.google.dev/gemini-api/docs/models/gemini-2.5-flash-preview-tts","open_weight":false,"description":"The Interactions API is now generally available. We recommend using this API for access to all the latest features and models. Home Gemini API Docs Send feedback Gemini 2.5 Flash Text-to-Speech Our fastest engine for high-fidelity speech synthesis, offering low-latency and cost-efficient audio generation. 
Gemini 2.5 Flash TTS is best for real-time assistants, high-volume narration, and conversational use cases that require fine-grained control over voice style and pacing.","tagline":"Our fastest engine for high-fidelity speech synthesis, offering low-latency and cost-efficient audio generation."},{"id":"gemini-2.5-flash","name":"gemini-2.5-flash","created_by":"google","source":"official","last_updated":"2026-06-29","family":"gemini-2.5","status":"active","knowledge_cutoff":"2025-01","context_window":1048576,"max_output_tokens":65536,"capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text","image","video","audio"],"output":["text","image","audio"]},"pricing":{"input":0.3,"output":2.5,"cached_input":0.03,"batch_input":0.15,"batch_output":1.25,"tiers":[{"label":"Text tokens","unit":"Per 1M tokens","columns":["Input","Cached input","Output"],"rows":[{"label":"Standard","values":[0.3,0.03,2.5]},{"label":"Batch","values":[0.15,null,1.25]}]}]},"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"model_type":"chat","license":"proprietary","page_url":"https://ai.google.dev/gemini-api/docs/models/gemini-2.5-flash","open_weight":false,"description":"The Interactions API is now generally available. We recommend using this API for access to all the latest features and models. Home Gemini API Docs Send feedback Gemini 2.5 Flash Our best model in terms of price-performance, offering well-rounded capabilities. 
2.5 Flash is best for large scale processing, low-latency, high volume tasks that require thinking, and agentic use cases.","tagline":"Our best model in terms of price-performance, offering well-rounded capabilities."},{"id":"gemini-2.5-pro-preview-03-25","name":"gemini-2.5-pro-preview-03-25","created_by":"google","source":"official","last_updated":"2026-03-23","family":"gemini-2.5","status":"deprecated","deprecation_date":"2025-12-02","successor":"gemini-3.1-pro-preview","capabilities":{"streaming":true,"vision":true},"modalities":{"input":["text","image"],"output":["text"]},"model_type":"chat","license":"proprietary","open_weight":false},{"id":"gemini-2.5-pro-preview-05-06","name":"gemini-2.5-pro-preview-05-06","created_by":"google","source":"official","last_updated":"2026-03-23","family":"gemini-2.5","status":"deprecated","deprecation_date":"2025-12-02","successor":"gemini-3.1-pro-preview","capabilities":{"streaming":true,"vision":true},"modalities":{"input":["text","image"],"output":["text"]},"model_type":"chat","license":"proprietary","open_weight":false},{"id":"gemini-2.5-pro-preview-06-05","name":"gemini-2.5-pro-preview-06-05","created_by":"google","source":"official","last_updated":"2026-03-23","family":"gemini-2.5","status":"deprecated","deprecation_date":"2025-12-02","successor":"gemini-3.1-pro-preview","capabilities":{"streaming":true,"vision":true},"modalities":{"input":["text","image"],"output":["text"]},"model_type":"chat","license":"proprietary","open_weight":false},{"id":"gemini-2.5-pro-preview-tts","name":"gemini-2.5-pro-preview-tts","created_by":"google","source":"official","last_updated":"2026-06-29","family":"gemini-2.5","status":"active","context_window":8192,"max_output_tokens":16384,"model_type":"tts","capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text","image","audio"],"output":["text","image","audio"]},"pricing":{"input":1,"outpu
t":20,"batch_input":0.5,"batch_output":10,"tiers":[{"label":"Text tokens","unit":"Per 1M tokens","columns":["Input","Cached input","Output"],"rows":[{"label":"Standard","values":[1,null,20]},{"label":"Batch","values":[0.5,null,10]}]}]},"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"license":"proprietary","page_url":"https://ai.google.dev/gemini-api/docs/models/gemini-2.5-pro-preview-tts","open_weight":false,"description":"The Interactions API is now generally available. We recommend using this API for access to all the latest features and models. Home Gemini API Docs Send feedback Gemini 2.5 Pro Text-to-Speech Our premium engine for studio-quality speech synthesis, offering high-fidelity and sophisticated audio generation. Gemini 2.5 Pro TTS is best for long-form content, professional narrations, and complex creative workflows that require the highest level of vocal clarity and natural prosody.","tagline":"Our premium engine for studio-quality speech synthesis, offering high-fidelity and sophisticated audio generation."},{"id":"gemini-2.5-pro","name":"gemini-2.5-pro","created_by":"google","source":"official","last_updated":"2026-06-29","family":"gemini-2.5","status":"active","knowledge_cutoff":"2025-01","context_window":1048576,"max_output_tokens":65536,"capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text","image","video","audio"],"output":["text","image","audio"]},"pricing":{"input":1.25,"output":10,"cached_input":0.125,"batch_input":0.625,"batch_output":5,"tiers":[{"label":"Text tokens","unit":"Per 1M tokens","columns":["Input","Cached 
input","Output"],"rows":[{"label":"Standard","values":[1.25,0.125,10]},{"label":"Batch","values":[0.625,null,5]}]}]},"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"model_type":"chat","license":"proprietary","page_url":"https://ai.google.dev/gemini-api/docs/models/gemini-2.5-pro","open_weight":false,"description":"The Interactions API is now generally available. We recommend using this API for access to all the latest features and models. Home Gemini API Docs Send feedback Gemini 2.5 Pro Our state-of-the-art thinking model, capable of reasoning over complex problems in code, math, and STEM, as well as analyzing large datasets, codebases, and documents using long context.","tagline":"Our state-of-the-art thinking model, capable of reasoning over complex problems in code, math, and STEM, as well as analyzing large datasets, codebases, and documents using long context."},{"id":"gemini-3-flash-preview","name":"gemini-3-flash-preview","created_by":"google","source":"official","last_updated":"2026-06-29","family":"gemini-3","status":"active","knowledge_cutoff":"2025-01","context_window":1048576,"max_output_tokens":65536,"capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text","image","video","audio"],"output":["text","image","audio"]},"pricing":{"input":0.5,"output":3,"cached_input":0.05,"batch_input":0.25,"batch_output":1.5,"tiers":[{"label":"Text tokens","unit":"Per 1M tokens","columns":["Input","Cached input","Output"],"rows":[{"label":"Standard","values":[0.5,0.05,3]},{"label":"Batch","values":[0.25,null,1.5]}]}]},"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"model_type":"chat","license":"proprietary","page_url":"https://ai.google.dev/gemini-api/docs/models/gemini-3-flash-preview","open_weight":false,"description":"The Interactions API is now generally available. 
We recommend using this API for access to all the latest features and models. Home Gemini API Docs Send feedback Gemini 3 Flash Preview The best model in the world for multimodal understanding, and our most powerful agentic and vibe-coding model yet, delivering richer visuals and deeper interactivity, all built on a foundation of state-of-the-art reasoning.","tagline":"The best model in the world for multimodal understanding, and our most powerful agentic and vibe-coding model yet, delivering richer visuals and deeper interactivity, all built on a foundation of stat"},{"id":"gemini-3-pro-image-preview","name":"gemini-3-pro-image-preview","created_by":"google","source":"official","last_updated":"2026-06-29","family":"gemini-3","status":"deprecated","knowledge_cutoff":"2025-01","context_window":65536,"max_output_tokens":32768,"capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":2,"output":12,"batch_input":1,"batch_output":6,"tiers":[{"label":"Text tokens","unit":"Per 1M tokens","columns":["Input","Cached 
input","Output"],"rows":[{"label":"Standard","values":[2,null,12]},{"label":"Batch","values":[1,null,6]}]}]},"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"model_type":"chat","license":"proprietary","page_url":"https://ai.google.dev/gemini-api/docs/models/gemini-3-pro-image-preview","open_weight":false,"deprecation_date":"2026-06-25","successor":"gemini-3-pro-image"},{"id":"gemini-3-pro-image","name":"gemini-3-pro-image","created_by":"google","source":"official","family":"gemini-3","status":"active","knowledge_cutoff":"2025-01","context_window":65536,"max_output_tokens":32768,"license":"proprietary","page_url":"https://ai.google.dev/gemini-api/docs/models/gemini-3-pro-image","model_type":"chat","capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text","image","audio"],"output":["text","image","audio"]},"pricing":{"input":2,"output":12,"batch_input":1,"batch_output":6,"tiers":[{"label":"Text tokens","unit":"Per 1M tokens","columns":["Input","Cached input","Output"],"rows":[{"label":"Standard","values":[2,null,12]},{"label":"Batch","values":[1,null,6]}]}]},"open_weight":false,"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"last_updated":"2026-06-29","description":"The Interactions API is now generally available. We recommend using this API for access to all the latest features and models. Home Gemini API Docs Send feedback Gemini 3 Pro Image Nano Banana Pro is a sophisticated reasoning-driven engine for professional-grade image editing and generation, offering studio-quality precision and advanced creative control. 
Nano Banana Pro is best for complex graphic design, high-fidelity product mockups, and factual data visualizations that require accurate text rendering and real-world grounding via Google Search.","tagline":"The Interactions API is now generally available."},{"id":"gemini-3-pro-preview","name":"gemini-3-pro-preview","created_by":"google","source":"official","last_updated":"2026-03-24","family":"gemini-3","status":"deprecated","deprecation_date":"2026-03-09","knowledge_cutoff":"2025-01","context_window":1048576,"max_output_tokens":65536,"successor":"gemini-3.1-pro-preview","capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text","image","video","audio"],"output":["text","image","audio"]},"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"model_type":"chat","license":"proprietary","page_url":"https://ai.google.dev/gemini-api/docs/models/gemini-3-pro-preview","open_weight":false},{"id":"gemini-3.1-flash-image-preview","name":"gemini-3.1-flash-image-preview","created_by":"google","source":"official","last_updated":"2026-06-29","family":"gemini-3.1","status":"deprecated","knowledge_cutoff":"2025-01","context_window":131072,"max_output_tokens":32768,"capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":0.5,"output":3,"batch_input":0.25,"batch_output":1.5,"tiers":[{"label":"Text tokens","unit":"Per 1M tokens","columns":["Input","Cached 
input","Output"],"rows":[{"label":"Standard","values":[0.5,null,3]},{"label":"Batch","values":[0.25,null,1.5]}]}]},"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"model_type":"chat","license":"proprietary","page_url":"https://ai.google.dev/gemini-api/docs/models/gemini-3.1-flash-image-preview","open_weight":false,"deprecation_date":"2026-06-25","successor":"gemini-3.1-flash-image"},{"id":"gemini-3.1-flash-image","name":"gemini-3.1-flash-image","created_by":"google","source":"official","family":"gemini-3.1","status":"active","knowledge_cutoff":"2025-01","context_window":131072,"max_output_tokens":32768,"license":"proprietary","page_url":"https://ai.google.dev/gemini-api/docs/models/gemini-3.1-flash-image","model_type":"chat","capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text","image","audio"],"output":["text","image","audio"]},"pricing":{"input":0.5,"output":3,"batch_input":0.25,"batch_output":1.5,"tiers":[{"label":"Text tokens","unit":"Per 1M tokens","columns":["Input","Cached input","Output"],"rows":[{"label":"Standard","values":[0.5,null,3]},{"label":"Batch","values":[0.25,null,1.5]}]}]},"open_weight":false,"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"last_updated":"2026-06-29","description":"The Interactions API is now generally available. We recommend using this API for access to all the latest features and models. Home Gemini API Docs Send feedback Gemini 3.1 Flash Image Nano Banana 2 provides high-quality image generation and conversational editing at a mainstream price point and low latency. It serves as the high-efficiency counterpart to Gemini 3 Pro Image , optimized for speed and high-volume developer use cases. 
Key updates: New output resolution options: New support for 0.5K, 2K and 4K, default 1K New Image Search Grounding: Integration of both text and image search results to inform generation with real-time web data Supported with Thinking on or off New 1:4, 4:1, 1:8 and 8:1 aspect ratios Improved aspect ratio adherence Improved image quality and consistency Improved i18n text rendering","tagline":"The Interactions API is now generally available."},{"id":"gemini-3.1-flash-lite-preview","name":"gemini-3.1-flash-lite-preview","created_by":"google","source":"official","last_updated":"2026-05-29","family":"gemini-3.1","status":"deprecated","knowledge_cutoff":"2025-01","context_window":1048576,"max_output_tokens":65536,"capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text","image","video","audio"],"output":["text","image","audio"]},"pricing":{"input":0.25,"output":1.5,"cached_input":0.025,"batch_input":0.125,"batch_output":0.75,"tiers":[{"label":"Text tokens","unit":"Per 1M tokens","columns":["Input","Cached input","Output"],"rows":[{"label":"Standard","values":[0.25,0.025,1.5]},{"label":"Batch","values":[0.125,null,0.75]}]}]},"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"model_type":"chat","license":"proprietary","page_url":"https://ai.google.dev/gemini-api/docs/models/gemini-3.1-flash-lite-preview","open_weight":false,"description":"Our most cost-efficient multimodal model, offering the fastest performance for high-frequency, lightweight tasks. 
Gemini 3.1 Flash-Lite is best for high-volume agentic tasks, simple data extraction, and extremely low-latency applications where budget and speed are the primary constraints.","tagline":"Our most cost-efficient multimodal model, offering the fastest performance for high-frequency, lightweight tasks.","deprecation_date":"2026-05-25","successor":"gemini-3.1-flash-lite"},{"id":"gemini-3.1-flash-lite","name":"gemini-3.1-flash-lite","created_by":"google","source":"official","family":"gemini-3.1","description":"The Interactions API is now generally available. We recommend using this API for access to all the latest features and models. Home Gemini API Docs Send feedback Gemini 3.1 Flash-Lite Gemini 3.1 Flash-Lite is a low-latency, cost-effective multimodal model optimized for high-frequency, lightweight tasks. The model supports text, image, video, audio, and PDF inputs, and is designed for high-volume agentic workflows, simple data extraction, and applications where latency and API cost are the primary constraints.","status":"active","knowledge_cutoff":"2025-01","context_window":1048576,"max_output_tokens":65536,"license":"proprietary","page_url":"https://ai.google.dev/gemini-api/docs/models/gemini-3.1-flash-lite","model_type":"chat","tagline":"The model supports text, image, video, audio, and PDF inputs, and is designed for high-volume agentic workflows, simple data extraction, and applications where latency and API cost are the primary con","capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text","image","video","audio"],"output":["text","image","audio"]},"pricing":{"input":0.25,"output":1.5,"cached_input":0.025,"batch_input":0.125,"batch_output":0.75,"tiers":[{"label":"Text tokens","unit":"Per 1M tokens","columns":["Input","Cached 
input","Output"],"rows":[{"label":"Standard","values":[0.25,0.025,1.5]},{"label":"Batch","values":[0.125,null,0.75]}]}]},"open_weight":false,"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"last_updated":"2026-06-29"},{"id":"gemini-3.1-flash-live-preview","name":"gemini-3.1-flash-live-preview","created_by":"google","source":"official","family":"gemini-3.1","status":"active","knowledge_cutoff":"2025-01","context_window":131072,"max_output_tokens":65536,"license":"proprietary","page_url":"https://ai.google.dev/gemini-api/docs/models/gemini-3.1-flash-live-preview","model_type":"chat","capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text","image","video","audio"],"output":["text","image","audio"]},"pricing":{"input":0.75,"output":4.5,"tiers":[{"label":"Text tokens","unit":"Per 1M tokens","columns":["Input","Cached input","Output"],"rows":[{"label":"Standard","values":[0.75,null,4.5]}]}]},"open_weight":false,"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"last_updated":"2026-06-29","description":"The Interactions API is now generally available. We recommend using this API for access to all the latest features and models. Home Gemini API Docs Send feedback Gemini 3.1 Flash Live Preview Gemini 3.1 Flash Live Preview is our low-latency, audio-to-audio model optimized for real-time dialogue and voice-first AI applications with acoustic nuance detection, numeric precision, and multimodal awareness.","tagline":"The Interactions API is now generally available."},{"id":"gemini-3.1-flash-tts-preview","name":"gemini-3.1-flash-tts-preview","created_by":"google","source":"official","family":"gemini-3.1","description":"The Interactions API is now generally available. We recommend using this API for access to all the latest features and models. 
Home Gemini API Docs Send feedback Gemini 3.1 Flash TTS (Text-to-Speech) Preview The Gemini 3.1 Flash TTS Preview model provides powerful, low-latency speech generation with natural outputs, steerable prompts, and new expressive audio tags for precise narration control.","status":"active","knowledge_cutoff":"2025-01","context_window":8192,"max_output_tokens":16384,"license":"proprietary","page_url":"https://ai.google.dev/gemini-api/docs/models/gemini-3.1-flash-tts-preview","model_type":"tts","tagline":"The Gemini 3.1 Flash TTS Preview model provides powerful, low-latency speech generation with natural outputs, steerable prompts, and new expressive audio tags for precise narration control.","capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text","image","audio"],"output":["text","image","audio"]},"pricing":{"input":1,"output":20,"batch_input":0.5,"batch_output":10,"tiers":[{"label":"Text tokens","unit":"Per 1M tokens","columns":["Input","Cached input","Output"],"rows":[{"label":"Standard","values":[1,null,20]},{"label":"Batch","values":[0.5,null,10]}]}]},"open_weight":false,"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"last_updated":"2026-06-29"},{"id":"gemini-3.1-pro-preview","name":"gemini-3.1-pro-preview","created_by":"google","source":"official","last_updated":"2026-06-29","family":"gemini-3.1","status":"active","knowledge_cutoff":"2025-01","context_window":1048576,"max_output_tokens":65536,"capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text","image","video","audio"],"output":["text","image","audio"]},"pricing":{"input":2,"output":12,"cached_input":0.2,"batch_input":1,"batch_output":6,"tiers":[{"label":"Text tokens","unit":"Per 1M tokens","columns":["Input","Cached 
input","Output"],"rows":[{"label":"Standard","values":[2,0.2,12]},{"label":"Batch","values":[1,null,6]}]}]},"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"model_type":"chat","license":"proprietary","page_url":"https://ai.google.dev/gemini-api/docs/models/gemini-3.1-pro-preview","open_weight":false,"description":"The Interactions API is now generally available. We recommend using this API for access to all the latest features and models. Home Gemini API Docs Send feedback Gemini 3.1 Pro Preview Built to refine the performance and reliability of the Gemini 3 Pro series, Gemini 3.1 Pro Preview provides better thinking, improved token efficiency, and a more grounded, factually consistent experience. It's optimized for software engineering behavior and usability, as well as agentic workflows requiring precise tool usage and reliable multi-step execution across real-world domains.","tagline":"The Interactions API is now generally available."},{"id":"gemini-3.5-flash","name":"gemini-3.5-flash","created_by":"google","source":"official","family":"gemini-3.5","status":"active","knowledge_cutoff":"2025-01","context_window":1048576,"max_output_tokens":65536,"license":"proprietary","page_url":"https://ai.google.dev/gemini-api/docs/models/gemini-3.5-flash","model_type":"chat","capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text","image","video","audio"],"output":["text","image","audio"]},"pricing":{"input":1.5,"output":9,"cached_input":0.15,"batch_input":0.75,"batch_output":4.5,"tiers":[{"label":"Text tokens","unit":"Per 1M tokens","columns":["Input","Cached input","Output"],"rows":[{"label":"Standard","values":[1.5,0.15,9]},{"label":"Batch","values":[0.75,null,4.5]}]}]},"open_weight":false,"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"last_updated":"2026-06-29","description":"The 
Interactions API is now generally available. We recommend using this API for access to all the latest features and models. Home Gemini API Docs Send feedback Gemini 3.5 Flash Gemini 3.5 Flash provides sustained frontier-level intelligence optimized for real-world tasks at a higher speed and lower cost. Designed for the agentic era, it excels at sub-agent deployment, multi-step workflows, and long-horizon tasks at scale. This model is particularly effective for rapid agentic loops involving complex coding cycles and iterations.","tagline":"The Interactions API is now generally available."},{"id":"gemini-3.5-live-translate-preview","name":"gemini-3.5-live-translate-preview","created_by":"google","source":"official","family":"gemini-3.5","status":"active","knowledge_cutoff":"2025-01","context_window":131072,"max_output_tokens":65536,"license":"proprietary","page_url":"https://ai.google.dev/gemini-api/docs/models/gemini-3.5-live-translate-preview","model_type":"translation","capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text","image","audio"],"output":["text","image","audio"]},"pricing":{"input":3.5,"output":21,"tiers":[{"label":"Text tokens","unit":"Per 1M tokens","columns":["Input","Cached input","Output"],"rows":[{"label":"Standard","values":[3.5,null,21]}]}]},"open_weight":false,"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"last_updated":"2026-06-29","description":"The Interactions API is now generally available. We recommend using this API for access to all the latest features and models. Home Gemini API Docs Send feedback Gemini 3.5 Live Translate Gemini 3.5 Live Translate is our low-latency, audio-to-audio model optimized for real-time translation of spoken conversations. 
It enables seamless, bidirectional translation with high accuracy and natural voice output.","tagline":"The Interactions API is now generally available."},{"id":"gemini-embedding-001","name":"gemini-embedding-001","created_by":"google","source":"official","last_updated":"2026-03-27","status":"active","context_window":2048,"model_type":"embed","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["generateContent","streamGenerateContent"],"family":"gemini-embedding","license":"proprietary","page_url":"https://ai.google.dev/gemini-api/docs/models/gemini-embedding-001","open_weight":false},{"id":"gemini-embedding-2-preview","name":"gemini-embedding-2-preview","created_by":"google","source":"official","last_updated":"2026-03-23","status":"active","context_window":8192,"model_type":"embed","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["generateContent","streamGenerateContent"],"family":"gemini-embedding","license":"proprietary","page_url":"https://ai.google.dev/gemini-api/docs/models/gemini-embedding-2-preview","open_weight":false},{"id":"gemini-embedding-2","name":"gemini-embedding-2","created_by":"google","source":"official","family":"gemini-embedding","status":"active","context_window":8192,"license":"proprietary","page_url":"https://ai.google.dev/gemini-api/docs/models/gemini-embedding-2","model_type":"embed","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.2,"tiers":[{"label":"Text tokens","unit":"Per 1M tokens","columns":["Input","Cached 
input","Output"],"rows":[{"label":"Standard","values":[0.2,null,null]},{"label":"Batch","values":[0.1,null,null]}]}],"batch_input":0.1},"open_weight":false,"endpoints":["generateContent","streamGenerateContent"],"last_updated":"2026-05-29"},{"id":"gemini-embedding-exp-03-07","name":"gemini-embedding-exp-03-07","created_by":"google","source":"official","last_updated":"2026-06-02","status":"deprecated","deprecation_date":"2025-10-30","successor":"gemini-embedding-2","model_type":"embed","modalities":{"input":["text"],"output":["text"]},"family":"gemini-embedding","license":"proprietary","open_weight":false},{"id":"gemini-embedding-exp","name":"gemini-embedding-exp","created_by":"google","source":"official","last_updated":"2026-06-02","status":"deprecated","deprecation_date":"2025-10-30","successor":"gemini-embedding-2","model_type":"embed","modalities":{"input":["text"],"output":["text"]},"family":"gemini-embedding","license":"proprietary","open_weight":false},{"id":"gemini-live-2.5-flash-preview","name":"gemini-live-2.5-flash-preview","created_by":"google","source":"official","last_updated":"2026-03-27","status":"deprecated","deprecation_date":"2025-12-09","successor":"gemini-3.1-flash-live-preview","capabilities":{"streaming":true,"vision":true},"modalities":{"input":["text","image"],"output":["text"]},"family":"gemini-2.5","model_type":"chat","license":"proprietary","open_weight":false},{"id":"gemini-robotics-er-1.5-preview","name":"gemini-robotics-er-1.5-preview","created_by":"google","source":"official","last_updated":"2026-06-29","status":"deprecated","knowledge_cutoff":"2025-01","context_window":1048576,"max_output_tokens":65536,"capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text","image","video","audio"],"output":["text","image","audio"]},"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"family":"gemini-1.5","mod
el_type":"chat","license":"proprietary","page_url":"https://ai.google.dev/gemini-api/docs/models/gemini-robotics-er-1.5-preview","open_weight":false,"deprecation_date":"2026-04-30","successor":"gemini-robotics-er-1.6-preview","description":"The Interactions API is now generally available. We recommend using this API for access to all the latest features and models. Home Gemini API Docs Send feedback Gemini Robotics-ER 1.5 Note: This version is planned for deprecation soon . See the models page for the latest model version. Gemini Robotics-ER 1.5 is a vision-language model (VLM) that brings Gemini's agentic capabilities to robotics. It's designed for advanced reasoning in the physical world, allowing robots to interpret complex visual data, perform spatial reasoning, and plan actions from natural language commands.","tagline":"The Interactions API is now generally available."},{"id":"gemini-robotics-er-1.6-preview","name":"gemini-robotics-er-1.6-preview","created_by":"google","source":"official","family":"gemini-1.6","status":"active","knowledge_cutoff":"2025-01","context_window":131072,"max_output_tokens":65536,"license":"proprietary","page_url":"https://ai.google.dev/gemini-api/docs/models/gemini-robotics-er-1.6-preview","model_type":"chat","capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text","image","video","audio"],"output":["text","image","audio"]},"open_weight":false,"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"last_updated":"2026-06-29","description":"The Interactions API is now generally available. We recommend using this API for access to all the latest features and models. Home Gemini API Docs Send feedback Gemini Robotics-ER 1.6 Gemini Robotics-ER 1.6 is a vision-language model (VLM) that brings Gemini's agentic capabilities to robotics. 
It's designed for advanced reasoning in the physical world, allowing robots to interpret complex visual data, perform spatial reasoning, and plan actions from natural language commands.","tagline":"The Interactions API is now generally available."},{"id":"imagen-3.0-generate-002","name":"imagen-3.0-generate-002","created_by":"google","source":"official","last_updated":"2026-03-23","status":"deprecated","deprecation_date":"2025-11-10","successor":"imagen-4.0-generate-001","model_type":"image","modalities":{"input":["text"],"output":["image"]},"family":"imagen-3.0","license":"proprietary","open_weight":false},{"id":"imagen-4.0-fast-generate-001","name":"imagen-4.0-fast-generate-001","created_by":"google","source":"official","last_updated":"2026-03-27","status":"active","model_type":"image","modalities":{"input":["text"],"output":["image"]},"family":"imagen-4.0","license":"proprietary","open_weight":false},{"id":"imagen-4.0-generate-001","name":"imagen-4.0-generate-001","created_by":"google","source":"official","last_updated":"2026-03-27","status":"active","model_type":"image","modalities":{"input":["text"],"output":["image"]},"family":"imagen-4.0","license":"proprietary","open_weight":false},{"id":"imagen-4.0-generate-preview-06-06","name":"imagen-4.0-generate-preview-06-06","created_by":"google","source":"official","last_updated":"2026-03-23","status":"deprecated","deprecation_date":"2026-02-17","successor":"imagen-4.0-generate-001","model_type":"image","modalities":{"input":["text"],"output":["image"]},"family":"imagen-4.0","license":"proprietary","open_weight":false},{"id":"imagen-4.0-ultra-generate-001","name":"imagen-4.0-ultra-generate-001","created_by":"google","source":"official","last_updated":"2026-03-27","status":"active","model_type":"image","modalities":{"input":["text"],"output":["image"]},"family":"imagen-4.0","license":"proprietary","open_weight":false},{"id":"imagen-4.0-ultra-generate-preview-06-06","name":"imagen-4.0-ultra-generate-preview-06-06","cre
ated_by":"google","source":"official","last_updated":"2026-03-23","status":"deprecated","deprecation_date":"2026-02-17","successor":"imagen-4.0-ultra-generate-001","model_type":"image","modalities":{"input":["text"],"output":["image"]},"family":"imagen-4.0","license":"proprietary","open_weight":false},{"id":"imagen","name":"imagen","created_by":"google","source":"official","last_updated":"2026-06-29","status":"active","context_window":480,"model_type":"image","capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text"],"output":["image"]},"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"family":"imagen","license":"proprietary","page_url":"https://ai.google.dev/gemini-api/docs/models/imagen","open_weight":false,"description":"The Interactions API is now generally available. We recommend using this API for access to all the latest features and models. Home Gemini API Docs Send feedback Imagen 4 The Imagen 4 standard, ultra, and fast endpoints are deprecated and will be shut down on **August 17, 2026**; migrate to Gemini 3.1 Flash Image to avoid service interruptions. A high-performance engine for advanced visual synthesis, offering sophisticated creative control and photorealistic output. 
Use Imagen 4 for professional branding, intricate scene composition, and high-fidelity design tasks that require precise text rendering and complex lighting.","tagline":"A high-performance engine for advanced visual synthesis, offering sophisticated creative control and photorealistic output."},{"id":"lyria-3-clip-preview","name":"lyria-3-clip-preview","created_by":"google","source":"official","status":"active","context_window":131072,"license":"proprietary","page_url":"https://ai.google.dev/gemini-api/docs/models/lyria-3-clip-preview","model_type":"tts","capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text"],"output":["audio"]},"open_weight":false,"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"last_updated":"2026-06-29","description":"The Interactions API is now generally available. We recommend using this API for access to all the latest features and models. Home Gemini API Docs Send feedback Lyria 3 Clip Preview Lyria 3 Clip Preview is Google's model optimized for generating short musical clips, loops, and previews. It generates 30-second high-quality, 48kHz stereo audio from text prompts or image inputs.","tagline":"The Interactions API is now generally available."},{"id":"lyria-3-pro-preview","name":"lyria-3-pro-preview","created_by":"google","source":"official","status":"active","context_window":131072,"license":"proprietary","page_url":"https://ai.google.dev/gemini-api/docs/models/lyria-3-pro-preview","model_type":"tts","capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text"],"output":["audio"]},"open_weight":false,"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"last_updated":"2026-06-29","description":"The Interactions API is now generally available. 
We recommend using this API for access to all the latest features and models. Home Gemini API Docs Send feedback Lyria 3 Pro Preview Lyria 3 Pro Preview is Google's flagship music generation model. It is optimized for generating full-length songs with complex structural coherence, including multiple verses, choruses, and bridges. It generates high-quality, 48kHz stereo audio from text prompts or image inputs.","tagline":"The Interactions API is now generally available."},{"id":"lyria-realtime-exp","name":"lyria-realtime-exp","created_by":"google","source":"official","last_updated":"2026-03-24","status":"active","model_type":"tts","capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text"],"output":["audio"]},"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"license":"proprietary","page_url":"https://ai.google.dev/gemini-api/docs/models/lyria-realtime-exp","open_weight":false},{"id":"text-embedding-004","name":"text-embedding-004","created_by":"google","source":"official","last_updated":"2026-06-02","status":"deprecated","deprecation_date":"2026-01-14","successor":"gemini-embedding-2","model_type":"embed","modalities":{"input":["text"],"output":["text"]},"family":"text-embedding","license":"proprietary","open_weight":false},{"id":"veo-2.0-generate-001","name":"veo-2.0-generate-001","created_by":"google","source":"official","last_updated":"2026-06-30","status":"deprecated","model_type":"video","capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text","image"],"output":["video"]},"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"family":"veo-2.0","license":"proprietary","page_url":"https://ai.google.dev/gemini-api/docs/models/veo-2.0-generate-001","open_weight":false,"description":"The
 Interactions API is now generally available. We recommend using this API for access to all the latest features and models. Home Gemini API Docs Send feedback Veo 2.0 This model is deprecated and will be shut down on **June 30, 2026**; migrate to Veo 3.1 Preview or the GA models available through the Gemini Enterprise Agent Platform to avoid service interruptions. Our robust and reliable stable video generation model, providing consistent performance for production-ready workflows. Veo 2.0 is best for standard 1080p content creation, social media assets, and high-volume video tasks that prioritize reliable character consistency and predictable sub-second generation speeds.","tagline":"Our robust and reliable stable video generation model, providing consistent performance for production-ready workflows.","deprecation_date":"2026-06-30","successor":["veo-3.1-generate-preview","the GA models on the Gemini Enterprise Agent Platf","m"]},{"id":"veo-3.0-fast-generate-001","name":"veo-3.0-fast-generate-001","created_by":"google","source":"official","family":"veo-3.0","status":"deprecated","license":"proprietary","model_type":"video","modalities":{"input":["text"],"output":["video"]},"open_weight":false,"last_updated":"2026-06-30","deprecation_date":"2026-06-30","successor":["veo-3.1-fast-generate-preview","the GA models on the Gemini Enterprise Agent 
Platf","m"]},{"id":"veo-3.0-fast-generate-preview","name":"veo-3.0-fast-generate-preview","created_by":"google","source":"official","last_updated":"2026-03-23","status":"deprecated","deprecation_date":"2025-11-12","successor":"veo-3.1-fast-generate-preview","model_type":"video","modalities":{"input":["text"],"output":["video"]},"family":"veo-3.0","license":"proprietary","open_weight":false},{"id":"veo-3.0-generate-001","name":"veo-3.0-generate-001","created_by":"google","source":"official","family":"veo-3.0","status":"deprecated","license":"proprietary","model_type":"video","modalities":{"input":["text"],"output":["video"]},"open_weight":false,"last_updated":"2026-06-30","deprecation_date":"2026-06-30","successor":["veo-3.1-generate-preview","the GA models on the Gemini Enterprise Agent Platf","m"]},{"id":"veo-3.0-generate-preview","name":"veo-3.0-generate-preview","created_by":"google","source":"official","last_updated":"2026-03-23","status":"deprecated","deprecation_date":"2025-11-12","successor":"veo-3.1-generate-preview","model_type":"video","modalities":{"input":["text"],"output":["video"]},"family":"veo-3.0","license":"proprietary","open_weight":false},{"id":"veo-3.1-fast-generate-preview","name":"veo-3.1-fast-generate-preview","created_by":"google","source":"official","family":"veo-3.1","status":"deprecated","deprecation_date":"2025-10-15","license":"proprietary","model_type":"video","modalities":{"input":["text"],"output":["video"]},"open_weight":false,"last_updated":"2026-03-26"},{"id":"veo-3.1-generate-preview","name":"veo-3.1-generate-preview","created_by":"google","source":"official","last_updated":"2026-06-29","status":"active","context_window":1024,"model_type":"video","capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text","image"],"output":["video"]},"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"family
":"veo-3.1","license":"proprietary","page_url":"https://ai.google.dev/gemini-api/docs/models/veo-3.1-generate-preview","open_weight":false,"description":"The Interactions API is now generally available. We recommend using this API for access to all the latest features and models. Home Gemini API Docs Send feedback Veo 3.1 A state-of-the-art cinematic engine designed for high-end creative storytelling and experimental video production. Veo 3.1 is best for professional-grade 4K output, natively synchronized audio generation, and complex camera movements that require the highest level of temporal consistency and artistic control.","tagline":"A state-of-the-art cinematic engine designed for high-end creative storytelling and experimental video production."},{"id":"veo-3.1-lite-generate-preview","name":"veo-3.1-lite-generate-preview","created_by":"google","source":"official","family":"veo-3.1","status":"active","context_window":1024,"license":"proprietary","page_url":"https://ai.google.dev/gemini-api/docs/models/veo-3.1-lite-generate-preview","model_type":"video","capabilities":{"streaming":true,"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"open_weight":false,"endpoints":["generateContent","streamGenerateContent"],"last_updated":"2026-06-29","description":"The Interactions API is now generally available. We recommend using this API for access to all the latest features and models. Home Gemini API Docs Send feedback Veo 3.1 Lite Preview Veo 3.1 Lite Preview is a high-efficiency, developer-first video model providing high-fidelity video generation, editing, and cinematic control. 
It leverages the state-of-the-art Veo 3.1 model to democratize professional-grade video AI by offering a scalable, programmable interface for creators and enterprises.","tagline":"The Interactions API is now generally available."}]}; export const models: Model[] = provider.models.map((m) => ({ ...m, provider: provider.id })); diff --git a/packages/npm/src/providers/huggingface.ts b/packages/npm/src/providers/huggingface.ts index 3916ac7fe..d10ec0101 100644 --- a/packages/npm/src/providers/huggingface.ts +++ b/packages/npm/src/providers/huggingface.ts @@ -3,6 +3,6 @@ import type { ProviderWithModels, Model } from '../types'; -export const provider: ProviderWithModels = {"id":"huggingface","name":"Hugging Face","region":"US","headquarters":"New York, NY","founded":2016,"url":"https://huggingface.co","api_url":"https://router.huggingface.co/v1","docs_url":"https://huggingface.co/docs/api-inference","pricing_url":"https://huggingface.co/pricing","description":"The AI community platform hosting open-source models with serverless inference endpoints.","type":"aggregator","sdk":{"python":"huggingface_hub","javascript":"@huggingface/inference"},"openai_compatible":true,"free_tier":true,"github_url":"https://github.com/huggingface","models_url":"https://huggingface.co/models","twitter_url":"https://x.com/huggingface","discord_url":"https://discord.com/invite/hugging-face-879548962464493619","blog_url":"https://huggingface.co/blog","terms_url":"https://huggingface.co/terms-of-service","support_url":"https://huggingface.co/support","icon":"\n 
\n","models":[{"id":"0xgr3y/Qwen2.5-Coder-0.5B-Instruct-Gensyn-Swarm-tall_tame_panther","name":"Qwen2.5-Coder-0.5B-Instruct-Gensyn-Swarm-tall_tame_panther","created_by":"0xgr3y","source":"official","release_date":"2025-11-13","context_window":32768,"license":"mit","parameters":0.49,"page_url":"https://huggingface.co/0xgr3y/Qwen2.5-Coder-0.5B-Instruct-Gensyn-Swarm-tall_tame_panther","architecture":"transformer","model_type":"code","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-05-01"},{"id":"aaditya/Llama3-OpenBioLLM-8B","name":"Llama3-OpenBioLLM-8B","created_by":"aaditya","source":"official","last_updated":"2026-03-24","page_url":"https://huggingface.co/aaditya/Llama3-OpenBioLLM-8B","model_type":"chat","capabilities":{"streaming":true,"fine_tuning":true},"description":"Introducing OpenBioLLM-8B: A State-of-the-Art Open Source Biomedical Large Language Model","release_date":"2024-04-20","context_window":8192,"license":"llama3","tagline":"Introducing OpenBioLLM-8B: A State-of-the-Art Open Source Biomedical Large Language 
Model","architecture":"transformer","open_weight":true,"modalities":{"input":["text"],"output":["text"]}},{"id":"allenai/Olmo-3-7B-Instruct","name":"Olmo-3-7B-Instruct","created_by":"allenai","source":"official","last_updated":"2026-06-29","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"parameters":7.3,"page_url":"https://huggingface.co/allenai/Olmo-3-7B-Instruct","release_date":"2025-11-19","context_window":65536,"license":"apache-2.0","architecture":"transformer","open_weight":true,"tools":["function_calling"]},{"id":"allenai/Olmo-3.1-32B-Instruct","name":"Olmo-3.1-32B-Instruct","created_by":"allenai","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"parameters":32,"page_url":"https://huggingface.co/allenai/Olmo-3.1-32B-Instruct","release_date":"2025-12-10","context_window":65536,"license":"apache-2.0","architecture":"transformer","open_weight":true,"tools":["function_calling"]},{"id":"alpindale/Llama-3.2-1B-Instruct","name":"Llama-3.2-1B-Instruct","created_by":"alpindale","source":"official","family":"Llama-3.2","release_date":"2024-09-25","context_window":131072,"license":"llama3.2","parameters":1.2,"page_url":"https://huggingface.co/alpindale/Llama-3.2-1B-Instruct","architecture":"transformer","model_type":"chat","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-04-01"},{"id":"anthracite-org/magnum-v4-72b","name":"magnum-v4-72b","created_by":"anthracite-org","source":"official","description":"This is a series of models designed to replicate the prose quality of the Claude 3 models, specifically Sonnet and Opus.","release_date":"2024-09-20","context_window":32768,"license":"apache-2.0","parameters":73,"page_url":"https://huggingface.co/anthracite-org/magnum-v4-72b","architecture":"transformer","tagline":"This is a series of models 
designed to replicate the prose quality of the Claude 3 models, specifically Sonnet and Opus.","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"tools":["function_calling"],"last_updated":"2026-05-01"},{"id":"arcee-ai/Trinity-Large-Thinking","name":"Trinity-Large-Thinking","created_by":"arcee-ai","source":"official","description":"src=\"https://cdn-uploads.huggingface.co/production/uploads/6435718aaaef013d1aec3b8b/i-v1KyAMOW_mgVGeic9WJ.png\" alt=\"Arcee Trinity Large Thinking\" style=\"max-width: 100%; height: auto;\" >","release_date":"2026-04-01","context_window":262144,"license":"apache-2.0","parameters":399,"active_parameters":6.2,"page_url":"https://huggingface.co/arcee-ai/Trinity-Large-Thinking","architecture":"moe","tagline":"src=\"https://cdn-uploads.huggingface.co/production/uploads/6435718aaaef013d1aec3b8b/i-v1KyAMOW_mgVGeic9WJ.png\" alt=\"Arcee Trinity Large Thinking\" style=\"max-width: 100%; height: auto;\" >","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"tools":["function_calling"],"last_updated":"2026-04-10"},{"id":"argilla/Llama-3.2-1B-Instruct-APIGen-FC-v0.1","name":"Llama-3.2-1B-Instruct-APIGen-FC-v0.1","created_by":"argilla","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"family":"Llama-3.2","model_type":"chat","parameters":1,"page_url":"https://huggingface.co/argilla/Llama-3.2-1B-Instruct-APIGen-FC-v0.1","description":"This model is a fine-tuned version of [meta-llama/Llama-3.2-1B-Instruct](https://huggingface.co/meta-llama/Llama-3.2-1B-Instruct) on [argilla-warehouse/apigen-synth-trl](https://huggingface.co/datasets/argilla-warehouse/apigen-synth-trl) dataset, a version of [argilla/Synth-APIGen-v0.1](https://huggingface.co/datasets/argilla-warehouse/Synth-APIGen-v0.1) ready to do SFT on top of it. 
It has been trained using [TRL](https://github.com/huggingface/trl).","release_date":"2024-10-07","context_window":131072,"license":"apache-2.0","tagline":"This model is a fine-tuned version of [meta-llama/Llama-3.2-1B-Instruct](https://huggingface.co/meta-llama/Llama-3.2-1B-Instruct) on [argilla-warehouse/apigen-synth-trl](https://huggingface.co/datasets/argilla-warehouse/apigen-synth-trl) dataset, a version of [argilla/Synth-APIGen-v0.1](https://huggingface.co/datasets/argilla-warehouse/Synth-APIGen-v0.1) ready to do SFT on top of it.","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"argilla-warehouse/Llama-3.2-1B-Instruct-v2-FC","name":"Llama-3.2-1B-Instruct-v2-FC","created_by":"argilla-warehouse","source":"official","last_updated":"2026-03-23","capabilities":{"streaming":true,"tool_call":true},"family":"Llama-3.2","model_type":"chat","parameters":1,"page_url":"https://huggingface.co/argilla-warehouse/Llama-3.2-1B-Instruct-v2-FC","description":"This model is a fine-tuned version of [meta-llama/Llama-3.2-1B-Instruct](https://huggingface.co/meta-llama/Llama-3.2-1B-Instruct) on the [argilla-warehouse/apigen-smollm-trl-FC](https://huggingface.co/datasets/argilla-warehouse/apigen-smollm-trl-FC) dataset. 
It has been trained using [TRL](https://github.com/huggingface/trl).","release_date":"2024-10-20","context_window":131072,"tagline":"This model is a fine-tuned version of [meta-llama/Llama-3.2-1B-Instruct](https://huggingface.co/meta-llama/Llama-3.2-1B-Instruct) on the [argilla-warehouse/apigen-smollm-trl-FC](https://huggingface.co/datasets/argilla-warehouse/apigen-smollm-trl-FC) dataset.","architecture":"transformer","tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"baseten/Llama-3.2-3B-Instruct-pythonic","name":"Llama-3.2-3B-Instruct-pythonic","created_by":"baseten","source":"official","family":"Llama-3.2","release_date":"2025-09-12","context_window":131072,"license":"llama3.2","parameters":3.2,"page_url":"https://huggingface.co/baseten/Llama-3.2-3B-Instruct-pythonic","architecture":"transformer","model_type":"chat","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-05-29"},{"id":"codellama/CodeLlama-7b-Instruct-hf","name":"CodeLlama-7b-Instruct-hf","created_by":"codellama","source":"official","family":"codellama","description":"Code Llama is a collection of pretrained and fine-tuned generative text models ranging in scale from 7 billion to 34 billion parameters. This is the repository for the 7B instruct-tuned version in the Hugging Face Transformers format. This model is designed for general code synthesis and understanding. 
Links to other models can be found in the index at the bottom.","release_date":"2023-08-24","context_window":16384,"license":"llama2","parameters":6.7,"page_url":"https://huggingface.co/codellama/CodeLlama-7b-Instruct-hf","architecture":"transformer","model_type":"code","tagline":"Code Llama is a collection of pretrained and fine-tuned generative text models ranging in scale from 7 billion to 34 billion parameters.","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-05-01"},{"id":"deepcogito/cogito-v1-preview-qwen-32B","name":"cogito-v1-preview-qwen-32B","created_by":"deepcogito","source":"official","release_date":"2025-03-31","context_window":131072,"license":"apache-2.0","page_url":"https://huggingface.co/deepcogito/cogito-v1-preview-qwen-32B","architecture":"transformer","model_type":"chat","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-05-29","parameters":33},{"id":"DeepMount00/Llama-3-8b-Ita","name":"Llama-3-8b-Ita","created_by":"deepmount00","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"family":"Llama-3","model_type":"chat","parameters":8,"page_url":"https://huggingface.co/DeepMount00/Llama-3-8b-Ita","description":"**💡 Found this resource helpful?** Creating and maintaining open source AI models and datasets requires significant computational resources. If this work has been valuable to you, consider [supporting my research](https://buymeacoffee.com/michele.montebovi) to help me continue building tools that benefit the entire AI community. Every contribution directly funds more open source innovation! 
☕","release_date":"2024-05-01","context_window":8192,"license":"llama3","tagline":"**💡 Found this resource helpful?** Creating and maintaining open source AI models and datasets requires significant computational resources.","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"deepseek-ai/DeepSeek-R1-0528-Qwen3-8B","name":"DeepSeek-R1-0528-Qwen3-8B","created_by":"deepseek","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"model_type":"reasoning","parameters":8.2,"page_url":"https://huggingface.co/deepseek-ai/DeepSeek-R1-0528-Qwen3-8B","release_date":"2025-05-29","context_window":131072,"license":"mit","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"defog/sqlcoder-7b-2","name":"sqlcoder-7b-2","created_by":"defog","source":"official","description":"The model weights were updated at 7 AM UTC on Feb 7, 2024. 
The new model weights lead to a much more performant model – particularly for joins.","release_date":"2024-02-05","context_window":16384,"license":"cc-by-sa-4.0","parameters":6.7,"page_url":"https://huggingface.co/defog/sqlcoder-7b-2","architecture":"transformer","tagline":"The model weights were updated at 7 AM UTC on Feb 7, 2024.","capabilities":{"streaming":true,"fine_tuning":true},"open_weight":true,"last_updated":"2026-06-18"},{"id":"DeSTA-ntu/Llama-3.1-8B-Instruct","name":"Llama-3.1-8B-Instruct","created_by":"desta-ntu","source":"official","family":"Llama-3.1","release_date":"2025-07-06","context_window":131072,"parameters":8,"page_url":"https://huggingface.co/DeSTA-ntu/Llama-3.1-8B-Instruct","architecture":"transformer","model_type":"chat","capabilities":{"streaming":true,"tool_call":true},"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-05-01"},{"id":"dicta-il/DictaLM-3.0-1.7B-Instruct","name":"DictaLM-3.0-1.7B-Instruct","created_by":"dicta-il","source":"official","description":"[](https://dicta.org.il)","release_date":"2025-12-01","context_window":62080,"license":"apache-2.0","page_url":"https://huggingface.co/dicta-il/DictaLM-3.0-1.7B-Instruct","architecture":"transformer","tagline":"[](https://dicta.org.il)","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"tools":["function_calling"],"last_updated":"2026-06-10"},{"id":"dphn/Dolphin-Mistral-24B-Venice-Edition","name":"Dolphin-Mistral-24B-Venice-Edition","created_by":"dphn","source":"official","description":"Website: https://dphn.ai Twitter: https://x.com/dphnAI Web Chat: https://chat.dphn.ai Telegram bot: https://t.me/DolphinAI_bot","release_date":"2025-06-12","context_window":32768,"license":"apache-2.0","parameters":24,"page_url":"https://huggingface.co/dphn/Dolphin-Mistral-24B-Venice-Edition","architecture":"transformer","tagline":"Website: https://dphn.ai Twitter: https://x.com/dphnAI Web Chat: 
https://chat.dphn.ai Telegram bot: https://t.me/DolphinAI_bot","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"tools":["function_calling"],"last_updated":"2026-04-07"},{"id":"Efficient-Large-Model/gemma-2-2b-it","name":"gemma-2-2b-it","created_by":"efficient-large-model","source":"official","last_updated":"2026-03-24","family":"gemma-2","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"model_type":"chat","parameters":2.6,"page_url":"https://huggingface.co/Efficient-Large-Model/gemma-2-2b-it","description":"**Model Page**: [Gemma](https://ai.google.dev/gemma/docs/base)","release_date":"2024-12-12","context_window":8192,"license":"gemma","tagline":"**Model Page**: [Gemma](https://ai.google.dev/gemma/docs/base)","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"EssentialAI/rnj-1-instruct","name":"rnj-1-instruct","created_by":"essentialai","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"page_url":"https://huggingface.co/EssentialAI/rnj-1-instruct","description":"Rnj-1 is a family of 8B parameter open-weight, dense models trained from scratch by Essential AI, optimized for code and STEM with capabilities on par with SOTA open-weight models. These models perform well across a range of programming languages and boast strong agentic capabilities (e.g., inside agentic frameworks like mini-SWE-agent), while also excelling at tool-calling. 
They additionally exhibit strong capabilities in math and science.","release_date":"2025-12-04","context_window":32768,"license":"apache-2.0","parameters":8.3,"tagline":"style=\"vertical-align: middle;\" src=\"https://img.shields.io/badge/%F0%9F%8C%90%20Website-essential.ai-4b9fe1?color=4b9fe1&logoColor=white\"/>","architecture":"transformer","open_weight":true,"tools":["function_calling"],"model_type":"chat","modalities":{"input":["text"],"output":["text"]}},{"id":"failspy/llama-3-70B-Instruct-abliterated","name":"llama-3-70B-Instruct-abliterated","created_by":"failspy","source":"official","family":"llama-3","description":"This is meta-llama/Llama-3-70B-Instruct with orthogonalized bfloat16 safetensor weights, generated with the methodology that was described in the preview paper/blog post: '[Refusal in LLMs is mediated by a single direction](https://www.alignmentforum.org/posts/jGuXSZgv6qfdhMCuJ/refusal-in-llms-is-mediated-by-a-single-direction)' which I encourage you to read to understand more.","release_date":"2024-05-07","context_window":8192,"license":"llama3","page_url":"https://huggingface.co/failspy/llama-3-70B-Instruct-abliterated","architecture":"transformer","model_type":"chat","tagline":"This is meta-llama/Llama-3-70B-Instruct with orthogonalized bfloat16 safetensor weights, generated with the methodology that was described in the preview paper/blog post: '[Refusal in LLMs is 
mediated","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-04-07"},{"id":"failspy/Meta-Llama-3-8B-Instruct-abliterated-v3","name":"Meta-Llama-3-8B-Instruct-abliterated-v3","created_by":"failspy","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"family":"Llama-3","model_type":"chat","parameters":8,"page_url":"https://huggingface.co/failspy/Meta-Llama-3-8B-Instruct-abliterated-v3","description":"[My Jupyter \"cookbook\" to replicate the methodology can be found here, refined library coming soon](https://huggingface.co/failspy/llama-3-70B-Instruct-abliterated/blob/main/ortho_cookbook.ipynb)","release_date":"2024-05-20","context_window":8192,"license":"llama3","tagline":"[My Jupyter \"cookbook\" to replicate the methodology can be found here, refined library coming soon](https://huggingface.co/failspy/llama-3-70B-Instruct-abliterated/blob/main/ortho_cookbook.ipynb)","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"farbodtavakkoli/OTel-LLM-0.6B-IT","name":"OTel-LLM-0.6B-IT","created_by":"farbodtavakkoli","source":"official","description":"**OTel-LLM-0.6B-IT** is a telecom-specialized language model fine-tuned on telecommunications domain data. 
It is part of the [OTel Family of Models](https://huggingface.co/collections/farbodtavakkoli/otel-llm), an open-source initiative to build industry-standard AI models for the global telecommunications sector.","release_date":"2026-02-11","context_window":40960,"license":"apache-2.0","page_url":"https://huggingface.co/farbodtavakkoli/OTel-LLM-0.6B-IT","architecture":"transformer","tagline":"**OTel-LLM-0.6B-IT** is a telecom-specialized language model fine-tuned on telecommunications domain data.","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"tools":["function_calling"],"last_updated":"2026-04-17"},{"id":"farbodtavakkoli/OTel-LLM-1.2B-IT","name":"OTel-LLM-1.2B-IT","created_by":"farbodtavakkoli","source":"official","description":"**OTel-LLM-1.2B-IT** is a telecom-specialized language model fine-tuned on telecommunications domain data. It is part of the [OTel Family of Models](https://huggingface.co/collections/farbodtavakkoli/otel-llm), an open-source initiative to build industry-standard AI models for the global telecommunications sector.","release_date":"2026-03-10","context_window":128000,"license":"apache-2.0","page_url":"https://huggingface.co/farbodtavakkoli/OTel-LLM-1.2B-IT","architecture":"transformer","tagline":"**OTel-LLM-1.2B-IT** is a telecom-specialized language model fine-tuned on telecommunications domain data.","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"tools":["function_calling"],"last_updated":"2026-04-17"},{"id":"farbodtavakkoli/OTel-LLM-1.7B-IT","name":"OTel-LLM-1.7B-IT","created_by":"farbodtavakkoli","source":"official","description":"**OTel-LLM-1.7B-IT** is a telecom-specialized language model fine-tuned on telecommunications domain data. 
It is part of the [OTel Family of Models](https://huggingface.co/collections/farbodtavakkoli/otel-llm), an open-source initiative to build industry-standard AI models for the global telecommunications sector.","release_date":"2026-02-11","context_window":40960,"license":"apache-2.0","page_url":"https://huggingface.co/farbodtavakkoli/OTel-LLM-1.7B-IT","architecture":"transformer","tagline":"**OTel-LLM-1.7B-IT** is a telecom-specialized language model fine-tuned on telecommunications domain data.","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"tools":["function_calling"],"last_updated":"2026-04-17"},{"id":"farbodtavakkoli/OTel-LLM-12B-IT","name":"OTel-LLM-12B-IT","created_by":"farbodtavakkoli","source":"official","description":"**OTel-LLM-12B-IT** is a telecom-specialized language model fine-tuned on telecommunications domain data. It is part of the [OTel Family of Models](https://huggingface.co/collections/farbodtavakkoli/otel-llm), an open-source initiative to build industry-standard AI models for the global telecommunications sector.","release_date":"2026-02-11","license":"apache-2.0","page_url":"https://huggingface.co/farbodtavakkoli/OTel-LLM-12B-IT","architecture":"transformer","tagline":"**OTel-LLM-12B-IT** is a telecom-specialized language model fine-tuned on telecommunications domain data.","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"tools":["function_calling"],"last_updated":"2026-04-22"},{"id":"farbodtavakkoli/OTel-LLM-14B-IT","name":"OTel-LLM-14B-IT","created_by":"farbodtavakkoli","source":"official","description":"**OTel-LLM-14B-IT** is a telecom-specialized language model fine-tuned on telecommunications domain data. 
It is part of the [OTel Family of Models](https://huggingface.co/collections/farbodtavakkoli/otel-llm), an open-source initiative to build industry-standard AI models for the global telecommunications sector.","release_date":"2026-02-11","context_window":40960,"license":"apache-2.0","page_url":"https://huggingface.co/farbodtavakkoli/OTel-LLM-14B-IT","architecture":"transformer","tagline":"**OTel-LLM-14B-IT** is a telecom-specialized language model fine-tuned on telecommunications domain data.","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"tools":["function_calling"],"last_updated":"2026-04-17"},{"id":"farbodtavakkoli/OTel-LLM-1B-IT","name":"OTel-LLM-1B-IT","created_by":"farbodtavakkoli","source":"official","description":"**OTel-LLM-1B-IT** is a telecom-specialized language model fine-tuned on telecommunications domain data. It is part of the [OTel Family of Models](https://huggingface.co/collections/farbodtavakkoli/otel-llm), an open-source initiative to build industry-standard AI models for the global telecommunications sector.","release_date":"2026-02-11","context_window":32768,"license":"apache-2.0","parameters":1,"page_url":"https://huggingface.co/farbodtavakkoli/OTel-LLM-1B-IT","architecture":"transformer","tagline":"**OTel-LLM-1B-IT** is a telecom-specialized language model fine-tuned on telecommunications domain data.","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"tools":["function_calling"],"last_updated":"2026-04-17"},{"id":"farbodtavakkoli/OTel-LLM-20B-IT","name":"OTel-LLM-20B-IT","created_by":"farbodtavakkoli","source":"official","description":"**OTel-LLM-20B-IT** is a telecom-specialized language model fine-tuned on telecommunications domain data. 
It is part of the [OTel Family of Models](https://huggingface.co/collections/farbodtavakkoli/otel-llm), an open-source initiative to build industry-standard AI models for the global telecommunications sector.","release_date":"2026-02-13","context_window":131072,"license":"apache-2.0","page_url":"https://huggingface.co/farbodtavakkoli/OTel-LLM-20B-IT","architecture":"moe","tagline":"**OTel-LLM-20B-IT** is a telecom-specialized language model fine-tuned on telecommunications domain data.","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"tools":["function_calling"],"last_updated":"2026-04-17"},{"id":"farbodtavakkoli/OTel-LLM-270M-IT","name":"OTel-LLM-270M-IT","created_by":"farbodtavakkoli","source":"official","description":"**OTel-LLM-270M-IT** is a telecom-specialized language model fine-tuned on telecommunications domain data. It is part of the [OTel Family of Models](https://huggingface.co/collections/farbodtavakkoli/otel-llm), an open-source initiative to build industry-standard AI models for the global telecommunications sector.","release_date":"2026-02-11","context_window":32768,"license":"apache-2.0","parameters":0.27,"page_url":"https://huggingface.co/farbodtavakkoli/OTel-LLM-270M-IT","architecture":"transformer","tagline":"**OTel-LLM-270M-IT** is a telecom-specialized language model fine-tuned on telecommunications domain data.","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"tools":["function_calling"],"last_updated":"2026-04-17"},{"id":"farbodtavakkoli/OTel-LLM-27B-IT","name":"OTel-LLM-27B-IT","created_by":"farbodtavakkoli","source":"official","description":"**OTel-LLM-27B-IT** is a telecom-specialized language model fine-tuned on telecommunications domain data. 
It is part of the [OTel Family of Models](https://huggingface.co/collections/farbodtavakkoli/otel-llm), an open-source initiative to build industry-standard AI models for the global telecommunications sector.","release_date":"2026-02-11","license":"apache-2.0","page_url":"https://huggingface.co/farbodtavakkoli/OTel-LLM-27B-IT","architecture":"transformer","tagline":"**OTel-LLM-27B-IT** is a telecom-specialized language model fine-tuned on telecommunications domain data.","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"tools":["function_calling"],"last_updated":"2026-04-22"},{"id":"farbodtavakkoli/OTel-LLM-32B-IT","name":"OTel-LLM-32B-IT","created_by":"farbodtavakkoli","source":"official","description":"**OTel-LLM-32B-IT** is a telecom-specialized language model fine-tuned on telecommunications domain data. It is part of the [OTel Family of Models](https://huggingface.co/collections/farbodtavakkoli/otel-llm), an open-source initiative to build industry-standard AI models for the global telecommunications sector.","release_date":"2026-02-11","context_window":65536,"license":"apache-2.0","page_url":"https://huggingface.co/farbodtavakkoli/OTel-LLM-32B-IT","architecture":"transformer","tagline":"**OTel-LLM-32B-IT** is a telecom-specialized language model fine-tuned on telecommunications domain data.","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"tools":["function_calling"],"last_updated":"2026-04-17"},{"id":"farbodtavakkoli/OTel-LLM-4B-IT","name":"OTel-LLM-4B-IT","created_by":"farbodtavakkoli","source":"official","description":"**OTel-LLM-4B-IT** is a telecom-specialized language model fine-tuned on telecommunications domain data. 
It is part of the [OTel Family of Models](https://huggingface.co/collections/farbodtavakkoli/otel-llm), an open-source initiative to build industry-standard AI models for the global telecommunications sector.","release_date":"2026-02-11","license":"apache-2.0","parameters":4.3,"page_url":"https://huggingface.co/farbodtavakkoli/OTel-LLM-4B-IT","architecture":"transformer","tagline":"**OTel-LLM-4B-IT** is a telecom-specialized language model fine-tuned on telecommunications domain data.","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"tools":["function_calling"],"last_updated":"2026-04-17"},{"id":"farbodtavakkoli/OTel-LLM-7B-IT","name":"OTel-LLM-7B-IT","created_by":"farbodtavakkoli","source":"official","description":"**OTel-LLM-7B-IT** is a telecom-specialized language model fine-tuned on telecommunications domain data. It is part of the [OTel Family of Models](https://huggingface.co/collections/farbodtavakkoli/otel-llm), an open-source initiative to build industry-standard AI models for the global telecommunications sector.","release_date":"2026-02-11","context_window":65536,"license":"apache-2.0","page_url":"https://huggingface.co/farbodtavakkoli/OTel-LLM-7B-IT","architecture":"transformer","tagline":"**OTel-LLM-7B-IT** is a telecom-specialized language model fine-tuned on telecommunications domain data.","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"tools":["function_calling"],"last_updated":"2026-04-17"},{"id":"farbodtavakkoli/OTel-LLM-8.2B-IT","name":"OTel-LLM-8.2B-IT","created_by":"farbodtavakkoli","source":"official","description":"**OTel-LLM-8.2B-IT** is a telecom-specialized language model fine-tuned on telecommunications domain data. 
It is part of the [OTel Family of Models](https://huggingface.co/collections/farbodtavakkoli/otel-llm), an open-source initiative to build industry-standard AI models for the global telecommunications sector.","release_date":"2026-02-11","context_window":40960,"license":"apache-2.0","page_url":"https://huggingface.co/farbodtavakkoli/OTel-LLM-8.2B-IT","architecture":"transformer","tagline":"**OTel-LLM-8.2B-IT** is a telecom-specialized language model fine-tuned on telecommunications domain data.","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"tools":["function_calling"],"last_updated":"2026-04-17"},{"id":"farbodtavakkoli/OTel-LLM-8.3B-IT","name":"OTel-LLM-8.3B-IT","created_by":"farbodtavakkoli","source":"official","description":"**OTel-LLM-8.3B-IT** is a telecom-specialized language model fine-tuned on telecommunications domain data. It is part of the [OTel Family of Models](https://huggingface.co/collections/farbodtavakkoli/otel-llm), an open-source initiative to build industry-standard AI models for the global telecommunications sector.","release_date":"2026-02-11","context_window":32768,"license":"apache-2.0","page_url":"https://huggingface.co/farbodtavakkoli/OTel-LLM-8.3B-IT","architecture":"transformer","tagline":"**OTel-LLM-8.3B-IT** is a telecom-specialized language model fine-tuned on telecommunications domain 
data.","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"tools":["function_calling"],"last_updated":"2026-04-17"},{"id":"fdtn-ai/Foundation-Sec-8B-Instruct","name":"Foundation-Sec-8B-Instruct","created_by":"fdtn-ai","source":"official","release_date":"2025-07-29","context_window":131072,"license":"other","parameters":8,"page_url":"https://huggingface.co/fdtn-ai/Foundation-Sec-8B-Instruct","architecture":"transformer","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"tools":["function_calling"],"last_updated":"2026-04-01"},{"id":"Featherless-Chat-Models/Mistral-7B-Instruct-v0.2","name":"Mistral-7B-Instruct-v0.2","created_by":"featherless-chat-models","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"model_type":"chat","parameters":7.2,"page_url":"https://huggingface.co/Featherless-Chat-Models/Mistral-7B-Instruct-v0.2","release_date":"2025-05-08","context_window":32768,"license":"apache-2.0","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"FlagAlpha/Llama3-Chinese-8B-Instruct","name":"Llama3-Chinese-8B-Instruct","created_by":"flagalpha","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"model_type":"chat","parameters":8,"page_url":"https://huggingface.co/FlagAlpha/Llama3-Chinese-8B-Instruct","description":"Llama3-Chinese-8B-Instruct基于Llama3-8B中文微调对话模型,由Llama中文社区和AtomEcho(原子回声)联合研发,我们会持续提供更新的模型参数,模型训练过程见 [https://llama.family](https://llama.family)。","release_date":"2024-04-23","context_window":8192,"license":"apache-2.0","tagline":"Llama3-Chinese-8B-Instruct基于Llama3-8B中文微调对话模型,由Llama中文社区和AtomEcho(原子回声)联合研发,我们会持续提供更新的模型参数,模型训练过程见 
[https://llama.family](https://llama.family)。","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"google/gemma-1.1-2b-it","name":"gemma-1.1-2b-it","created_by":"google","source":"official","family":"gemma-1","release_date":"2024-03-26","license":"gemma","parameters":2.5,"page_url":"https://huggingface.co/google/gemma-1.1-2b-it","architecture":"transformer","model_type":"chat","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-05-29"},{"id":"google/gemma-2-27b-it","name":"gemma-2-27b-it","created_by":"google","source":"official","family":"gemma-2","release_date":"2024-06-24","license":"gemma","parameters":27,"page_url":"https://huggingface.co/google/gemma-2-27b-it","architecture":"transformer","model_type":"chat","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-05-01"},{"id":"google/gemma-2-2b-it","name":"gemma-2-2b-it","created_by":"google","source":"official","last_updated":"2026-03-24","family":"gemma-2","release_date":"2024-07-16","license":"gemma","parameters":2.6,"page_url":"https://huggingface.co/google/gemma-2-2b-it","architecture":"transformer","model_type":"chat","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"]},{"id":"google/gemma-2-2b-jpn-it","name":"gemma-2-2b-jpn-it","created_by":"google","source":"official","last_updated":"2026-03-24","family":"gemma-2","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"model_type":"chat","parameters":2.6,"page_url":"https://huggingface.co/google/gemma-2-2b-jpn-it","release_date":"2024-09-25","license":"gemma","architecture":"t
ransformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"google/gemma-2-9b-it","name":"gemma-2-9b-it","created_by":"google","source":"official","last_updated":"2026-03-24","family":"gemma-2","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"model_type":"chat","parameters":9.2,"page_url":"https://huggingface.co/google/gemma-2-9b-it","release_date":"2024-06-24","license":"gemma","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"google/gemma-2b-it","name":"gemma-2b-it","created_by":"google","source":"official","family":"gemma-2b","release_date":"2024-02-08","license":"gemma","page_url":"https://huggingface.co/google/gemma-2b-it","architecture":"transformer","model_type":"chat","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-05-29","parameters":2.5},{"id":"google/gemma-3-1b-it","name":"gemma-3-1b-it","created_by":"google","source":"official","family":"gemma-3","release_date":"2025-03-10","license":"gemma","parameters":1,"page_url":"https://huggingface.co/google/gemma-3-1b-it","architecture":"transformer","model_type":"chat","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-05-01"},{"id":"google/gemma-7b-it","name":"gemma-7b-it","created_by":"google","source":"official","family":"gemma-7b","release_date":"2024-02-13","license":"gemma","page_url":"https://huggingface.co/google/gemma-7b-it","architecture":"transformer","model_type":"chat","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-06-18","pa
rameters":8.5},{"id":"google/medgemma-27b-text-it","name":"medgemma-27b-text-it","created_by":"google","source":"official","release_date":"2025-05-19","license":"other","page_url":"https://huggingface.co/google/medgemma-27b-text-it","architecture":"transformer","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"tools":["function_calling"],"last_updated":"2026-05-29","parameters":27},{"id":"GraySwanAI/Llama-3-8B-Instruct-RR","name":"Llama-3-8B-Instruct-RR","created_by":"grayswanai","source":"official","last_updated":"2026-03-23","capabilities":{"streaming":true,"tool_call":true},"family":"Llama-3","model_type":"chat","parameters":8,"page_url":"https://huggingface.co/GraySwanAI/Llama-3-8B-Instruct-RR","description":"Llama-3-8B-Instruct-RR is a Llama-3 model with circuit breakers inserted using Representation Rerouting (RR).","release_date":"2024-07-08","context_window":8192,"tagline":"Llama-3-8B-Instruct-RR is a Llama-3 model with circuit breakers inserted using Representation Rerouting (RR).","architecture":"transformer","tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"GritLM/GritLM-7B","name":"GritLM-7B","created_by":"gritlm","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"parameters":7.2,"page_url":"https://huggingface.co/GritLM/GritLM-7B","description":"> GritLM is a generative representational instruction tuned language model. 
It unifies text representation (embedding) and text generation into a single model achieving state-of-the-art performance on both types of tasks.","release_date":"2024-02-11","context_window":32768,"license":"apache-2.0","tagline":"> GritLM is a generative representational instruction tuned language model.","architecture":"transformer","open_weight":true,"tools":["function_calling"]},{"id":"h2oai/h2ogpt-4096-llama2-7b-chat","name":"h2ogpt-4096-llama2-7b-chat","created_by":"h2oai","source":"official","description":"h2oGPT clone of [Meta's Llama 2 7B Chat](https://huggingface.co/meta-llama/Llama-2-7b-chat-hf).","release_date":"2023-08-09","context_window":4096,"license":"llama2","parameters":6.7,"page_url":"https://huggingface.co/h2oai/h2ogpt-4096-llama2-7b-chat","architecture":"transformer","tagline":"h2oGPT clone of [Meta's Llama 2 7B Chat](https://huggingface.co/meta-llama/Llama-2-7b-chat-hf).","capabilities":{"streaming":true,"fine_tuning":true},"open_weight":true,"last_updated":"2026-05-17"},{"id":"huihui-ai/DeepSeek-R1-Distill-Qwen-32B-abliterated","name":"DeepSeek-R1-Distill-Qwen-32B-abliterated","created_by":"huihui-ai","source":"official","description":"This is an uncensored version of [deepseek-ai/DeepSeek-R1-Distill-Qwen-32B](https://huggingface.co/deepseek-ai/DeepSeek-R1-Distill-Qwen-32B) created with abliteration (see [remove-refusals-with-transformers](https://github.com/Sumandora/remove-refusals-with-transformers) to know more about it). 
This is a crude, proof-of-concept implementation to remove refusals from an LLM model without using TransformerLens.","release_date":"2025-01-22","context_window":131072,"parameters":33,"page_url":"https://huggingface.co/huihui-ai/DeepSeek-R1-Distill-Qwen-32B-abliterated","architecture":"transformer","model_type":"reasoning","tagline":"This is an uncensored version of [deepseek-ai/DeepSeek-R1-Distill-Qwen-32B](https://huggingface.co/deepseek-ai/DeepSeek-R1-Distill-Qwen-32B) created with abliteration (see [remove-refusals-with-transformers](https://github.com/Sumandora/remove-refusals-with-transformers) to know more about it).","capabilities":{"streaming":true,"tool_call":true},"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-04-14"},{"id":"huihui-ai/Qwen2.5-14B-Instruct-abliterated-v2","name":"Qwen2.5-14B-Instruct-abliterated-v2","created_by":"huihui-ai","source":"official","description":"This is an uncensored version of [Qwen2.5-14B-Instruct](https://huggingface.co/Qwen/Qwen2.5-14B-Instruct) created with abliteration (see [this article](https://huggingface.co/blog/mlabonne/abliteration) to know more about it).","release_date":"2024-10-09","context_window":32768,"license":"apache-2.0","parameters":15,"page_url":"https://huggingface.co/huihui-ai/Qwen2.5-14B-Instruct-abliterated-v2","architecture":"transformer","model_type":"chat","tagline":"This is an uncensored version of [Qwen2.5-14B-Instruct](https://huggingface.co/Qwen/Qwen2.5-14B-Instruct) created with abliteration (see [this article](https://huggingface.co/blog/mlabonne/abliteratio","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-04-21"},{"id":"huihui-ai/Qwen2.5-14B-Instruct-abliterated","name":"Qwen2.5-14B-Instruct-abliterated","created_by":"huihui-ai","source":"official","description":"This is an uncensored version of 
[Qwen/Qwen2.5-14B-Instruct](https://huggingface.co/Qwen/Qwen2.5-14B-Instruct) created with abliteration (see [this article](https://huggingface.co/blog/mlabonne/abliteration) to know more about it).","release_date":"2024-09-25","context_window":32768,"license":"apache-2.0","parameters":15,"page_url":"https://huggingface.co/huihui-ai/Qwen2.5-14B-Instruct-abliterated","architecture":"transformer","model_type":"chat","tagline":"This is an uncensored version of [Qwen/Qwen2.5-14B-Instruct](https://huggingface.co/Qwen/Qwen2.5-14B-Instruct) created with abliteration (see [this article](https://huggingface.co/blog/mlabonne/ablite","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-05-23"},{"id":"huihui-ai/Qwen2.5-72B-Instruct-abliterated","name":"Qwen2.5-72B-Instruct-abliterated","created_by":"huihui-ai","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"model_type":"chat","parameters":73,"page_url":"https://huggingface.co/huihui-ai/Qwen2.5-72B-Instruct-abliterated","description":"This is an uncensored version of [Qwen/Qwen2.5-72B-Instruct](https://huggingface.co/Qwen/Qwen2.5-72B-Instruct) created with abliteration (see [remove-refusals-with-transformers](https://github.com/Sumandora/remove-refusals-with-transformers) to know more about it). 
This is a crude, proof-of-concept implementation to remove refusals from an LLM model without using TransformerLens.","release_date":"2024-10-26","context_window":32768,"license":"other","tagline":"This is an uncensored version of [Qwen/Qwen2.5-72B-Instruct](https://huggingface.co/Qwen/Qwen2.5-72B-Instruct) created with abliteration (see [remove-refusals-with-transformers](https://github.com/Sumandora/remove-refusals-with-transformers) to know more about it).","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"instruction-pretrain/finance-Llama3-8B","name":"finance-Llama3-8B","created_by":"instruction-pretrain","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"fine_tuning":true},"parameters":8,"page_url":"https://huggingface.co/instruction-pretrain/finance-Llama3-8B","description":"This repo contains the **finance model developed from Llama3-8B** in our paper [Instruction Pre-Training: Language Models are Supervised Multitask Learners](https://huggingface.co/papers/2406.14491).","release_date":"2024-06-18","context_window":8192,"license":"llama3","tagline":"This repo contains the **finance model developed from Llama3-8B** in our paper [Instruction Pre-Training: Language Models are Supervised Multitask 
Learners](https://huggingface.co/papers/2406.14491).","architecture":"transformer","open_weight":true},{"id":"Intel/neural-chat-7b-v3-3","name":"neural-chat-7b-v3-3","created_by":"intel","source":"official","last_updated":"2026-03-22","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"parameters":7.2,"page_url":"https://huggingface.co/Intel/neural-chat-7b-v3-3","release_date":"2023-12-09","context_window":32768,"license":"apache-2.0"},{"id":"invalid-coder/Sakura-SOLAR-Instruct-CarbonVillain-en-10.7B-v2-slerp","name":"Sakura-SOLAR-Instruct-CarbonVillain-en-10.7B-v2-slerp","created_by":"invalid-coder","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"parameters":11,"page_url":"https://huggingface.co/invalid-coder/Sakura-SOLAR-Instruct-CarbonVillain-en-10.7B-v2-slerp","description":"NeuralPipe-7B-slerp is a merge of the following models using [LazyMergekit](https://colab.research.google.com/drive/1obulZ1ROXHjYLn6PPZJwRR6GzgQogxxb?usp=sharing): * [jeonsworld/CarbonVillain-en-10.7B-v2](https://huggingface.co/jeonsworld/CarbonVillain-en-10.7B-v2) * [kyujinpy/Sakura-SOLAR-Instruct](https://huggingface.co/kyujinpy/Sakura-SOLAR-Instruct)","release_date":"2024-01-10","context_window":4096,"license":"apache-2.0","tagline":"NeuralPipe-7B-slerp is a merge of the following models using [LazyMergekit](https://colab.research.google.com/drive/1obulZ1ROXHjYLn6PPZJwRR6GzgQogxxb?usp=sharing): * 
[jeonsworld/CarbonVillain-en-10.7B","architecture":"transformer","open_weight":true,"tools":["function_calling"]},{"id":"kakaocorp/kanana-1.5-8b-instruct-2505","name":"kanana-1.5-8b-instruct-2505","created_by":"kakaocorp","source":"official","release_date":"2025-05-21","context_window":32768,"license":"apache-2.0","alias":"kakaocorp/kanana-1.5-8b-instruct","page_url":"https://huggingface.co/kakaocorp/kanana-1.5-8b-instruct-2505","architecture":"transformer","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"tools":["function_calling"],"last_updated":"2026-06-10"},{"id":"kakaocorp/kanana-1.5-8b-instruct","name":"kanana-1.5-8b-instruct-2505","created_by":"kakaocorp","source":"official","release_date":"2025-05-21","context_window":32768,"license":"apache-2.0","page_url":"https://huggingface.co/kakaocorp/kanana-1.5-8b-instruct-2505","architecture":"transformer","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"tools":["function_calling"],"snapshots":["kakaocorp/kanana-1.5-8b-instruct-2505"],"last_updated":"2026-06-10"},{"id":"llmfan46/Gemma-4-Garnet-V2-31B-it-ultra-uncensored-heretic","name":"Gemma-4-Garnet-V2-31B-it-ultra-uncensored-heretic","created_by":"llmfan46","source":"official","release_date":"2026-04-25","license":"apache-2.0","parameters":31,"page_url":"https://huggingface.co/llmfan46/Gemma-4-Garnet-V2-31B-it-ultra-uncensored-heretic","architecture":"transformer","model_type":"chat","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-06-29"},{"id":"lmstudio-community/Qwen3-1.7B-MLX-bf16","name":"Qwen3-1.7B-MLX-bf16","created_by":"lmstudio-community","source":"official","description":"This model [lmstudio-community/Qwen3-1.7B-MLX-bf16](https://huggingface.co/lmstudio-community/Qwen3-1.7B-MLX-bf16) was converted to MLX format from 
[Qwen/Qwen3-1.7B](https://huggingface.co/Qwen/Qwen3-1.7B) using mlx-lm version **0.24.0**.","release_date":"2025-04-28","context_window":40960,"license":"apache-2.0","parameters":1.7,"page_url":"https://huggingface.co/lmstudio-community/Qwen3-1.7B-MLX-bf16","architecture":"transformer","model_type":"chat","tagline":"This model [lmstudio-community/Qwen3-1.7B-MLX-bf16](https://huggingface.co/lmstudio-community/Qwen3-1.7B-MLX-bf16) was converted to MLX format from [Qwen/Qwen3-1.7B](https://huggingface.co/Qwen/Qwen3-","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-05-01"},{"id":"m8than/Mistral-Nemo-Instruct-2407-lenient-chatfix","name":"Mistral-Nemo-Instruct-2407-lenient-chatfix","created_by":"m8than","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"model_type":"chat","page_url":"https://huggingface.co/m8than/Mistral-Nemo-Instruct-2407-lenient-chatfix","description":"It's just mistral nemo 2407 with a less strict chat format.","release_date":"2025-05-06","context_window":131072,"license":"apache-2.0","parameters":12,"tagline":"It's just mistral nemo 2407 with a less strict chat 
format.","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"meta-llama/Llama-2-13b-chat-hf","name":"Llama-2-13b-chat-hf","created_by":"meta","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"family":"Llama-2","model_type":"chat","parameters":13,"page_url":"https://huggingface.co/meta-llama/Llama-2-13b-chat-hf","release_date":"2023-07-13","license":"llama2","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]},"context_window":4096,"max_output_tokens":4096},{"id":"meta-llama/Llama-3.1-70B-Instruct","name":"Llama-3.1-70B-Instruct","created_by":"meta","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"family":"Llama-3.1","model_type":"chat","parameters":71,"page_url":"https://huggingface.co/meta-llama/Llama-3.1-70B-Instruct","release_date":"2024-07-16","license":"llama3.1","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]},"context_window":131072,"max_output_tokens":131072,"knowledge_cutoff":"2023-12"},{"id":"meta-llama/Llama-3.1-8B-Instruct","name":"Llama-3.1-8B-Instruct","created_by":"meta","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"family":"Llama-3.1","model_type":"chat","parameters":8,"page_url":"https://huggingface.co/meta-llama/Llama-3.1-8B-Instruct","release_date":"2024-07-18","license":"llama3.1","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]},"context_window":131072,"max_output_tokens":131072,"knowledge_cutoff":"2023-12"},{"id":"meta-llama/Llama-3.2-1B-Instruct","name":"Llama-3.2-1B-Instruct","created_by":"meta","source":"official","last_updated
":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"family":"Llama-3.2","model_type":"chat","parameters":1.2,"page_url":"https://huggingface.co/meta-llama/Llama-3.2-1B-Instruct","release_date":"2024-09-18","license":"llama3.2","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]},"context_window":131072,"max_output_tokens":131072,"knowledge_cutoff":"2023-12"},{"id":"meta-llama/Llama-3.2-3B-Instruct","name":"Llama-3.2-3B-Instruct","created_by":"meta","source":"official","family":"Llama-3.2","release_date":"2024-09-18","license":"llama3.2","parameters":3.2,"page_url":"https://huggingface.co/meta-llama/Llama-3.2-3B-Instruct","architecture":"transformer","model_type":"chat","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-05-14","context_window":131072,"max_output_tokens":131072,"knowledge_cutoff":"2023-12"},{"id":"meta-llama/Llama-3.3-70B-Instruct","name":"Llama-3.3-70B-Instruct","created_by":"meta","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"family":"Llama-3.3","model_type":"chat","parameters":71,"page_url":"https://huggingface.co/meta-llama/Llama-3.3-70B-Instruct","release_date":"2024-11-26","license":"llama3.3","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]},"context_window":131072,"max_output_tokens":131072,"knowledge_cutoff":"2023-12"},{"id":"meta-llama/Meta-Llama-3-70B-Instruct","name":"Meta-Llama-3-70B-Instruct","created_by":"meta","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"family":"Llama-3","model_type":"chat","parameters":71,"page_url":"https://huggingface.co/meta-llama/Meta-Llama-3-70B-Instr
uct","release_date":"2024-04-17","license":"llama3","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]},"context_window":8192,"max_output_tokens":8192},{"id":"meta-llama/Meta-Llama-3-8B-Instruct","name":"Meta-Llama-3-8B-Instruct","created_by":"meta","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"family":"Llama-3","model_type":"chat","parameters":8,"page_url":"https://huggingface.co/meta-llama/Meta-Llama-3-8B-Instruct","release_date":"2024-04-17","license":"llama3","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]},"context_window":8192,"max_output_tokens":8192},{"id":"microsoft/Phi-3-mini-128k-instruct","name":"Phi-3-mini-128k-instruct","created_by":"microsoft","source":"official","description":"🎉**Phi-4**: [[multimodal-instruct](https://huggingface.co/microsoft/Phi-4-multimodal-instruct) | [onnx](https://huggingface.co/microsoft/Phi-4-multimodal-instruct-onnx)]; [[mini-instruct](https://huggingface.co/microsoft/Phi-4-mini-instruct) | [onnx](https://huggingface.co/microsoft/Phi-4-mini-instruct-onnx)]","release_date":"2024-04-22","context_window":131072,"license":"mit","parameters":3.8,"page_url":"https://huggingface.co/microsoft/Phi-3-mini-128k-instruct","architecture":"transformer","model_type":"chat","tagline":"🎉**Phi-4**: [[multimodal-instruct](https://huggingface.co/microsoft/Phi-4-multimodal-instruct) | [onnx](https://huggingface.co/microsoft/Phi-4-multimodal-instruct-onnx)]; [[mini-instruct](https://hug","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-05-29"},{"id":"microsoft/Phi-3-mini-4k-instruct","name":"Phi-3-mini-4k-instruct","created_by":"microsoft","source":"official","description":"🎉 
**Phi-3.5**: [[mini-instruct]](https://huggingface.co/microsoft/Phi-3.5-mini-instruct); [[MoE-instruct]](https://huggingface.co/microsoft/Phi-3.5-MoE-instruct) ; [[vision-instruct]](https://huggingface.co/microsoft/Phi-3.5-vision-instruct)","release_date":"2024-04-22","context_window":4096,"license":"mit","parameters":3.8,"page_url":"https://huggingface.co/microsoft/Phi-3-mini-4k-instruct","architecture":"transformer","model_type":"chat","tagline":"🎉 **Phi-3.5**: [[mini-instruct]](https://huggingface.co/microsoft/Phi-3.5-mini-instruct); [[MoE-instruct]](https://huggingface.co/microsoft/Phi-3.5-MoE-instruct) ; [[vision-instruct]](https://hugging","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-05-01"},{"id":"microsoft/Phi-4-mini-instruct","name":"Phi-4-mini-instruct","created_by":"microsoft","source":"official","description":"🎉**Phi-4**: [[mini-reasoning](https://huggingface.co/microsoft/Phi-4-mini-reasoning) | [reasoning](https://huggingface.co/microsoft/Phi-4-reasoning)] | [[multimodal-instruct](https://huggingface.co/microsoft/Phi-4-multimodal-instruct) | [onnx](https://huggingface.co/microsoft/Phi-4-multimodal-instruct-onnx)]; [[mini-instruct](https://huggingface.co/microsoft/Phi-4-mini-instruct) | [onnx](https://huggingface.co/microsoft/Phi-4-mini-instruct-onnx)]","release_date":"2025-02-19","context_window":131072,"license":"mit","page_url":"https://huggingface.co/microsoft/Phi-4-mini-instruct","architecture":"transformer","model_type":"chat","tagline":"🎉**Phi-4**: [[mini-reasoning](https://huggingface.co/microsoft/Phi-4-mini-reasoning) | [reasoning](https://huggingface.co/microsoft/Phi-4-reasoning)] | 
[[multimodal-instruct](https://huggingface.co/m","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-05-29","parameters":3.8},{"id":"mistralai/Mistral-7B-Instruct-v0.1","name":"Mistral-7B-Instruct-v0.1","created_by":"mistral","source":"official","release_date":"2023-09-27","context_window":32768,"license":"apache-2.0","page_url":"https://huggingface.co/mistralai/Mistral-7B-Instruct-v0.1","architecture":"transformer","model_type":"chat","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-05-23","parameters":7.2},{"id":"mistralai/Mistral-7B-Instruct-v0.2","name":"Mistral-7B-Instruct-v0.2","created_by":"mistral","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"model_type":"chat","parameters":7.2,"page_url":"https://huggingface.co/mistralai/Mistral-7B-Instruct-v0.2","release_date":"2023-12-11","context_window":32768,"license":"apache-2.0","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"mlabonne/Meta-Llama-3.1-8B-Instruct-abliterated","name":"Meta-Llama-3.1-8B-Instruct-abliterated","created_by":"mlabonne","source":"official","last_updated":"2026-03-24","family":"Llama-3.1","page_url":"https://huggingface.co/mlabonne/Meta-Llama-3.1-8B-Instruct-abliterated","model_type":"chat","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"description":"This is an uncensored version of Llama 3.1 8B Instruct created with abliteration (see [this article](https://huggingface.co/blog/mlabonne/abliteration) to know more about it).","release_date":"2024-07-24","context_window":131072,"license":"llama3.1","parameters":8,"tagline":"This is an 
uncensored version of Llama 3.1 8B Instruct created with abliteration (see [this article](https://huggingface.co/blog/mlabonne/abliteration) to know more about it).","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"mlabonne/NeuralDaredevil-8B-abliterated","name":"NeuralDaredevil-8B-abliterated","created_by":"mlabonne","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"parameters":8,"page_url":"https://huggingface.co/mlabonne/NeuralDaredevil-8B-abliterated","description":"This is a DPO fine-tune of [mlabonne/Daredevil-8-abliterated](https://huggingface.co/mlabonne/Daredevil-8B-abliterated), trained on one epoch of [mlabonne/orpo-dpo-mix-40k](https://huggingface.co/datasets/mlabonne/orpo-dpo-mix-40k). The DPO fine-tuning successfully recovers the performance loss due to the abliteration process, making it an excellent uncensored model.","release_date":"2024-05-27","context_window":8192,"license":"llama3","tagline":"This is a DPO fine-tune of [mlabonne/Daredevil-8-abliterated](https://huggingface.co/mlabonne/Daredevil-8B-abliterated), trained on one epoch of 
[mlabonne/orpo-dpo-mix-40k](https://huggingface.co/datasets/mlabonne/orpo-dpo-mix-40k).","architecture":"transformer","open_weight":true,"tools":["function_calling"]},{"id":"moonshotai/Kimi-K2-Instruct-0905","name":"Kimi-K2-Instruct-0905","created_by":"moonshot","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"family":"Kimi-K2","model_type":"chat","page_url":"https://huggingface.co/moonshotai/Kimi-K2-Instruct-0905","release_date":"2025-09-03","context_window":262144,"license":"other","parameters":1026,"architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"moonshotai/Kimi-K2-Instruct","name":"Kimi-K2-Instruct","created_by":"moonshot","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"family":"Kimi-K2","model_type":"chat","page_url":"https://huggingface.co/moonshotai/Kimi-K2-Instruct","release_date":"2025-07-11","context_window":131072,"license":"other","parameters":1026,"architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"moonshotai/Kimi-K2-Thinking","name":"Kimi-K2-Thinking","created_by":"moonshot","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true,"reasoning":true},"family":"Kimi-K2","model_type":"chat","page_url":"https://huggingface.co/moonshotai/Kimi-K2-Thinking","release_date":"2025-11-04","context_window":262144,"license":"other","parameters":1058,"architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]},"description":"Long-term thinking, multi-step tool usage, complex problem solving.","tagline":"Long-term thinking, multi-step tool usage, complex problem 
solving.","max_output_tokens":32768},{"id":"moonshotai/Kimi-Linear-48B-A3B-Instruct","name":"Kimi-Linear-48B-A3B-Instruct","created_by":"moonshot","source":"official","family":"kimi","release_date":"2025-10-30","license":"mit","parameters":49,"page_url":"https://huggingface.co/moonshotai/Kimi-Linear-48B-A3B-Instruct","architecture":"transformer","model_type":"chat","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-05-01"},{"id":"NousResearch/Meta-Llama-3-70B-Instruct","name":"Meta-Llama-3-70B-Instruct","created_by":"nousresearch","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"family":"Llama-3","model_type":"chat","parameters":71,"page_url":"https://huggingface.co/NousResearch/Meta-Llama-3-70B-Instruct","release_date":"2024-04-19","context_window":8192,"license":"other","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"NousResearch/Meta-Llama-3-8B-Instruct","name":"Meta-Llama-3-8B-Instruct","created_by":"nousresearch","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"family":"Llama-3","model_type":"chat","parameters":8,"page_url":"https://huggingface.co/NousResearch/Meta-Llama-3-8B-Instruct","release_date":"2024-04-18","context_window":8192,"license":"other","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"NousResearch/Meta-Llama-3.1-8B-Instruct","name":"Meta-Llama-3.1-8B-Instruct","created_by":"nousresearch","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"family":"Llama-3.1","model_type":"chat","parameters":8,"page_url":"https://huggingface.co/NousResear
ch/Meta-Llama-3.1-8B-Instruct","release_date":"2024-07-24","context_window":131072,"license":"llama3.1","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"nvidia/Gemma-4-31B-IT-NVFP4","name":"Gemma-4-31B-IT-NVFP4","created_by":"nvidia","source":"official","release_date":"2026-04-02","license":"other","parameters":21,"page_url":"https://huggingface.co/nvidia/Gemma-4-31B-IT-NVFP4","architecture":"transformer","model_type":"chat","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-05-14"},{"id":"nvidia/Llama-3.1-8B-Instruct-FP8","name":"Llama-3.1-8B-Instruct-FP8","created_by":"nvidia","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"family":"Llama-3.1","model_type":"chat","parameters":8,"page_url":"https://huggingface.co/nvidia/Llama-3.1-8B-Instruct-FP8","release_date":"2024-08-29","context_window":131072,"license":"llama3.1","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"openai/gpt-oss-120b","name":"gpt-oss-120b","created_by":"openai","source":"official","last_updated":"2026-03-24","family":"gpt-oss","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true,"structured_output":true,"reasoning":true,"json_mode":true,"vision":false,"batch":true},"model_type":"chat","parameters":120,"page_url":"https://huggingface.co/openai/gpt-oss-120b","description":"Welcome to the gpt-oss series, [OpenAI’s open-weight models](https://openai.com/open-models) designed for powerful reasoning, agentic tasks, and versatile developer use cases.","release_date":"2025-08-04","context_window":131072,"license":"apache-2.0","tagline":"Welcome to the gpt-oss series, [OpenAI’s open-weight 
models](https://openai.com/open-models) designed for powerful reasoning, agentic tasks, and versatile developer use cases.","architecture":"moe","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]},"max_output_tokens":131072,"knowledge_cutoff":"2024-06"},{"id":"openai/gpt-oss-20b","name":"gpt-oss-20b","created_by":"openai","source":"official","last_updated":"2026-03-24","family":"gpt-oss","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true,"structured_output":true,"reasoning":true,"json_mode":true,"vision":false,"batch":true},"model_type":"chat","parameters":22,"page_url":"https://huggingface.co/openai/gpt-oss-20b","description":"Welcome to the gpt-oss series, [OpenAI’s open-weight models](https://openai.com/open-models) designed for powerful reasoning, agentic tasks, and versatile developer use cases.","release_date":"2025-08-04","context_window":131072,"license":"apache-2.0","tagline":"Welcome to the gpt-oss series, [OpenAI’s open-weight models](https://openai.com/open-models) designed for powerful reasoning, agentic tasks, and versatile developer use cases.","architecture":"moe","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]},"max_output_tokens":131072,"knowledge_cutoff":"2024-06"},{"id":"openai/gpt-oss-safeguard-20b","name":"gpt-oss-safeguard-20b","created_by":"openai","source":"official","last_updated":"2026-05-29","family":"gpt-oss","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"model_type":"moderation","parameters":22,"page_url":"https://huggingface.co/openai/gpt-oss-safeguard-20b","description":"`gpt-oss-safeguard-120b` and `gpt-oss-safeguard-20b` are safety reasoning models built-upon gpt-oss. With these models, you can classify text content based on safety policies that you provide and perform a suite of foundational safety tasks. These models are intended for safety use cases. 
For other applications, we recommend using [gpt-oss models](https://huggingface.co/collections/openai/gpt-oss).","release_date":"2025-09-18","context_window":131072,"license":"apache-2.0","tagline":"`gpt-oss-safeguard-120b` and `gpt-oss-safeguard-20b` are safety reasoning models built-upon gpt-oss.","architecture":"moe","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"openchat/openchat-3.6-8b-20240522","name":"openchat-3.6-8b-20240522","created_by":"openchat","source":"official","last_updated":"2026-03-24","alias":"openchat/openchat-3.6-8b","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"parameters":8,"page_url":"https://huggingface.co/openchat/openchat-3.6-8b-20240522","description":"To use this model, we highly recommend installing the OpenChat package by following the [installation guide](https://github.com/imoneoi/openchat#installation) in our repository and using the OpenChat OpenAI-compatible API server by running the serving command from the table below. 
The server is optimized for high-throughput deployment using [vLLM](https://github.com/vllm-project/vllm) and can run on a consumer GPU with 24GB RAM.","release_date":"2024-05-07","context_window":8192,"license":"llama3","tagline":"To use this model, we highly recommend installing the OpenChat package by following the [installation guide](https://github.com/imoneoi/openchat#installation) in our repository and using the OpenChat OpenAI-compatible API server by running the serving command from the table below.","architecture":"transformer","open_weight":true,"tools":["function_calling"]},{"id":"openchat/openchat-3.6-8b","name":"openchat-3.6-8b-20240522","created_by":"openchat","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"snapshots":["openchat/openchat-3.6-8b-20240522"],"parameters":8,"page_url":"https://huggingface.co/openchat/openchat-3.6-8b-20240522","description":"To use this model, we highly recommend installing the OpenChat package by following the [installation guide](https://github.com/imoneoi/openchat#installation) in our repository and using the OpenChat OpenAI-compatible API server by running the serving command from the table below. 
The server is optimized for high-throughput deployment using [vLLM](https://github.com/vllm-project/vllm) and can run on a consumer GPU with 24GB RAM.","release_date":"2024-05-07","context_window":8192,"license":"llama3","tagline":"To use this model, we highly recommend installing the OpenChat package by following the [installation guide](https://github.com/imoneoi/openchat#installation) in our repository and using the OpenChat OpenAI-compatible API server by running the serving command from the table below.","architecture":"transformer","open_weight":true,"tools":["function_calling"]},{"id":"openchat/openchat_3.5","name":"openchat_3.5","created_by":"openchat","source":"official","description":"**🔥 The first 7B model Achieves Comparable Results with ChatGPT (March)! 🔥**","release_date":"2023-10-30","context_window":8192,"license":"apache-2.0","page_url":"https://huggingface.co/openchat/openchat_3.5","architecture":"transformer","tagline":"**🔥 The first 7B model Achieves Comparable Results with ChatGPT (March)! 
🔥**","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"tools":["function_calling"],"last_updated":"2026-05-01"},{"id":"OpenPipe/Qwen3-14B-Instruct","name":"Qwen3-14B-Instruct","created_by":"openpipe","source":"official","release_date":"2025-10-10","context_window":40960,"license":"apache-2.0","parameters":15,"page_url":"https://huggingface.co/OpenPipe/Qwen3-14B-Instruct","architecture":"transformer","model_type":"chat","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-05-01"},{"id":"Orion-zhen/Qwen2.5-7B-Instruct-Uncensored","name":"Qwen2.5-7B-Instruct-Uncensored","created_by":"orion-zhen","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"model_type":"chat","parameters":7.6,"page_url":"https://huggingface.co/Orion-zhen/Qwen2.5-7B-Instruct-Uncensored","description":"This model is an uncensored fine-tune version of Qwen2.5-7B-Instruct. 
However, I can still notice that though uncensored, the model fails to generate detailed descriptions on certain extreme scenarios, which might be associated with deletion on some pretrain datasets in Qwen's pretraining stage.","release_date":"2024-09-26","context_window":32768,"license":"gpl-3.0","tagline":"This model is an uncensored fine-tune version of Qwen2.5-7B-Instruct.","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"PatronusAI/Llama-3-Patronus-Lynx-8B-Instruct-v1.1","name":"Llama-3-Patronus-Lynx-8B-Instruct-v1.1","created_by":"patronusai","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"family":"Llama-3","model_type":"chat","parameters":8,"page_url":"https://huggingface.co/PatronusAI/Llama-3-Patronus-Lynx-8B-Instruct-v1.1","description":"Lynx is an open-source hallucination evaluation model. Patronus-Lynx-8B-Instruct-v1.1 was trained on a mix of datasets including CovidQA, PubmedQA, DROP, RAGTruth. The datasets contain a mix of hand-annotated and synthetic data. The maximum sequence length is 128000 tokens.","release_date":"2024-07-24","context_window":131072,"license":"cc-by-nc-4.0","tagline":"Lynx is an open-source hallucination evaluation model.","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"prefeitura-rio/Rio-3.0-Open-Mini","name":"Rio-3.0-Open-Mini","created_by":"prefeitura-rio","source":"official","description":"**Rio 3.0 Open Mini** is a frontier-class reasoning model developed by [IplanRIO](https://iplanrio.rio.rj.gov.br/), the municipal IT company of Rio de Janeiro's city government. 
Built through distillation on top of Qwen3-4B-Thinking-2507 using reasoning traces from our to be announced Rio 3.0 model, Rio 3.0 Open achieves state-of-the-art results across mathematics, STEM, and code benchmarks — surpassing its base model by significant margins and competing with models far larger than itself.","release_date":"2026-02-09","context_window":262144,"license":"mit","parameters":4,"page_url":"https://huggingface.co/prefeitura-rio/Rio-3.0-Open-Mini","architecture":"transformer","tagline":"**Rio 3.0 Open Mini** is a frontier-class reasoning model developed by [IplanRIO](https://iplanrio.rio.rj.gov.br/), the municipal IT company of Rio de Janeiro's city government.","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"tools":["function_calling"],"last_updated":"2026-05-01"},{"id":"Qwen/Qwen1.5-0.5B-Chat","name":"Qwen1.5-0.5B-Chat","created_by":"qwen","source":"official","release_date":"2024-01-31","context_window":32768,"license":"other","parameters":0.62,"page_url":"https://huggingface.co/Qwen/Qwen1.5-0.5B-Chat","architecture":"transformer","model_type":"chat","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-05-01"},{"id":"Qwen/Qwen1.5-1.8B-Chat","name":"Qwen1.5-1.8B-Chat","created_by":"qwen","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"model_type":"chat","parameters":1.8,"page_url":"https://huggingface.co/Qwen/Qwen1.5-1.8B-Chat","release_date":"2024-01-30","context_window":32768,"license":"other","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"Qwen/Qwen2-0.5B-Instruct","name":"Qwen2-0.5B-Instruct","created_by":"qwen","source":"official","release_date":"2024-06-03","context_window":32768,"license":"apache-2.0","paramete
rs":0.49,"page_url":"https://huggingface.co/Qwen/Qwen2-0.5B-Instruct","architecture":"transformer","model_type":"chat","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-05-01"},{"id":"Qwen/Qwen2-1.5B-Instruct","name":"Qwen2-1.5B-Instruct","created_by":"qwen","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"model_type":"chat","parameters":1.5,"page_url":"https://huggingface.co/Qwen/Qwen2-1.5B-Instruct","release_date":"2024-06-03","context_window":32768,"license":"apache-2.0","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"Qwen/Qwen2-72B-Instruct","name":"Qwen2-72B-Instruct","created_by":"qwen","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"model_type":"chat","parameters":73,"page_url":"https://huggingface.co/Qwen/Qwen2-72B-Instruct","release_date":"2024-05-28","context_window":32768,"license":"other","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]},"description":"Alibaba Cloud's Qwen2 open-source version. 
[Usage](https://www.alibabacloud.com/help/en/document_detail/2841718.html#24e54b27d4agt) \\| [API reference](https://www.alibabacloud.com/help/en/document_detail/2712576.html) \\| [Try online](https://modelstudio.console.alibabacloud.com/?tab=playground#/efm/prompt)","tagline":"The Qwen2 open-source model from Alibaba Cloud.","max_output_tokens":6144},{"id":"Qwen/Qwen2-7B-Instruct","name":"Qwen2-7B-Instruct","created_by":"qwen","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"model_type":"chat","parameters":7.6,"page_url":"https://huggingface.co/Qwen/Qwen2-7B-Instruct","release_date":"2024-06-04","context_window":32768,"license":"apache-2.0","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]},"description":"Alibaba Cloud's Qwen2 open-source version. [Usage](https://www.alibabacloud.com/help/en/document_detail/2841718.html#24e54b27d4agt) \\| [API reference](https://www.alibabacloud.com/help/en/document_detail/2712576.html) \\| [Try online](https://modelstudio.console.alibabacloud.com/?tab=playground#/efm/prompt)","tagline":"The Qwen2 open-source model from Alibaba 
Cloud."},{"id":"Qwen/Qwen2.5-0.5B-Instruct","name":"Qwen2.5-0.5B-Instruct","created_by":"qwen","source":"official","release_date":"2024-09-16","context_window":32768,"license":"apache-2.0","parameters":0.49,"page_url":"https://huggingface.co/Qwen/Qwen2.5-0.5B-Instruct","architecture":"transformer","model_type":"chat","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-05-01"},{"id":"Qwen/Qwen2.5-1.5B-Instruct","name":"Qwen2.5-1.5B-Instruct","created_by":"qwen","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"model_type":"chat","parameters":1.5,"page_url":"https://huggingface.co/Qwen/Qwen2.5-1.5B-Instruct","release_date":"2024-09-17","context_window":32768,"license":"apache-2.0","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"Qwen/Qwen2.5-14B-Instruct-1M","name":"Qwen2.5-14B-Instruct-1M","created_by":"qwen","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true,"reasoning":true,"structured_output":true,"batch":true,"json_mode":true},"model_type":"chat","parameters":15,"page_url":"https://huggingface.co/Qwen/Qwen2.5-14B-Instruct-1M","release_date":"2025-01-23","context_window":1010000,"license":"apache-2.0","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]},"description":"Qwen2.5 is part of the Qwen Large Language Model (LLM) series. We released a series of base language models and instruction-tuned language models with parameter scales ranging from 7 billion to 72 billion. Qwen2.5 improves upon Qwen2 in the following ways: * Pre-trained on our latest large-scale dataset containing up to 18 trillion tokens. 
* Significantly expanded knowledge and greatly enhanced coding and math capabilities due to our domain-expert models. * Major improvements in instruction following, long-text generation (over 8K tokens), structured data understanding (such as tables), and structured output generation (especially JSON). More resilient to diverse system prompts, enhancing chatbot role-playing and conditional setup. * Supports over 29 languages, including Chinese, English, French, Spanish, Portuguese, German, Italian, Russian, Japanese, Korean, Vietnamese, Thai, and Arabic. [Usage](https://www.alibabacloud.com/help/en/document_detail/2841718.html#24e54b27d4agt) \\| [API reference](https://www.alibabacloud.com/help/en/document_detail/2712576.html) \\| [Try online](https://modelstudio.console.alibabacloud.com/?tab=playground#/efm/prompt) ## International If you select the [International](https://www.alibabacloud.com/help/en/document_detail/3004398.html#080da663a75xh) deployment scope, model inference compute resources are dynamically scheduled worldwide, excluding the Chinese mainland. Static data is stored in your selected region. Supported region: Singapore.","tagline":"Qwen2.5 is a large language model series from Qwen.","max_output_tokens":8192},{"id":"Qwen/Qwen2.5-14B-Instruct","name":"Qwen2.5-14B-Instruct","created_by":"qwen","source":"official","last_updated":"2026-05-23","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true,"reasoning":true,"structured_output":true,"batch":true,"json_mode":true},"model_type":"chat","parameters":15,"page_url":"https://huggingface.co/Qwen/Qwen2.5-14B-Instruct","release_date":"2024-09-16","context_window":32768,"license":"apache-2.0","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]},"description":"Qwen2.5 is part of the Qwen Large Language Model (LLM) series. 
We released a series of base language models and instruction-tuned language models with parameter scales ranging from 7 billion to 72 billion. Qwen2.5 improves upon Qwen2 in the following ways: * Pre-trained on our latest large-scale dataset containing up to 18 trillion tokens. * Significantly expanded knowledge and greatly enhanced coding and math capabilities due to our domain-expert models. * Major improvements in instruction following, long-text generation (over 8K tokens), structured data understanding (such as tables), and structured output generation (especially JSON). More resilient to diverse system prompts, enhancing chatbot role-playing and conditional setup. * Supports over 29 languages, including Chinese, English, French, Spanish, Portuguese, German, Italian, Russian, Japanese, Korean, Vietnamese, Thai, and Arabic. [Usage](https://www.alibabacloud.com/help/en/document_detail/2841718.html#24e54b27d4agt) \\| [API reference](https://www.alibabacloud.com/help/en/document_detail/2712576.html) \\| [Try online](https://modelstudio.console.alibabacloud.com/?tab=playground#/efm/prompt) ## International If you select the [International](https://www.alibabacloud.com/help/en/document_detail/3004398.html#080da663a75xh) deployment scope, model inference compute resources are dynamically scheduled worldwide, excluding the Chinese mainland. Static data is stored in your selected region. 
Supported region: Singapore.","tagline":"Qwen2.5 is a large language model series from Qwen."},{"id":"Qwen/Qwen2.5-32B-Instruct","name":"Qwen2.5-32B-Instruct","created_by":"qwen","source":"official","last_updated":"2026-05-23","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true,"reasoning":true,"structured_output":true,"batch":true,"json_mode":true},"model_type":"chat","parameters":33,"page_url":"https://huggingface.co/Qwen/Qwen2.5-32B-Instruct","release_date":"2024-09-17","context_window":32768,"license":"apache-2.0","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]},"description":"Qwen2.5 is part of the Qwen Large Language Model (LLM) series. We released a series of base language models and instruction-tuned language models with parameter scales ranging from 7 billion to 72 billion. Qwen2.5 improves upon Qwen2 in the following ways: * Pre-trained on our latest large-scale dataset containing up to 18 trillion tokens. * Significantly expanded knowledge and greatly enhanced coding and math capabilities due to our domain-expert models. * Major improvements in instruction following, long-text generation (over 8K tokens), structured data understanding (such as tables), and structured output generation (especially JSON). More resilient to diverse system prompts, enhancing chatbot role-playing and conditional setup. * Supports over 29 languages, including Chinese, English, French, Spanish, Portuguese, German, Italian, Russian, Japanese, Korean, Vietnamese, Thai, and Arabic. 
[Usage](https://www.alibabacloud.com/help/en/document_detail/2841718.html#24e54b27d4agt) \\| [API reference](https://www.alibabacloud.com/help/en/document_detail/2712576.html) \\| [Try online](https://modelstudio.console.alibabacloud.com/?tab=playground#/efm/prompt) ## International If you select the [International](https://www.alibabacloud.com/help/en/document_detail/3004398.html#080da663a75xh) deployment scope, model inference compute resources are dynamically scheduled worldwide, excluding the Chinese mainland. Static data is stored in your selected region. Supported region: Singapore.","tagline":"Qwen2.5 is a large language model series from Qwen."},{"id":"Qwen/Qwen2.5-3B-Instruct","name":"Qwen2.5-3B-Instruct","created_by":"qwen","source":"official","release_date":"2024-09-17","context_window":32768,"license":"other","parameters":3.1,"page_url":"https://huggingface.co/Qwen/Qwen2.5-3B-Instruct","architecture":"transformer","model_type":"chat","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-05-01"},{"id":"Qwen/Qwen2.5-72B-Instruct","name":"Qwen2.5-72B-Instruct","created_by":"qwen","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true,"reasoning":true,"structured_output":true,"batch":true,"json_mode":true},"model_type":"chat","parameters":73,"page_url":"https://huggingface.co/Qwen/Qwen2.5-72B-Instruct","release_date":"2024-09-16","context_window":32768,"license":"other","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]},"description":"Qwen2.5 is part of the Qwen Large Language Model (LLM) series. We released a series of base language models and instruction-tuned language models with parameter scales ranging from 7 billion to 72 billion. 
Qwen2.5 improves upon Qwen2 in the following ways: * Pre-trained on our latest large-scale dataset containing up to 18 trillion tokens. * Significantly expanded knowledge and greatly enhanced coding and math capabilities due to our domain-expert models. * Major improvements in instruction following, long-text generation (over 8K tokens), structured data understanding (such as tables), and structured output generation (especially JSON). More resilient to diverse system prompts, enhancing chatbot role-playing and conditional setup. * Supports over 29 languages, including Chinese, English, French, Spanish, Portuguese, German, Italian, Russian, Japanese, Korean, Vietnamese, Thai, and Arabic. [Usage](https://www.alibabacloud.com/help/en/document_detail/2841718.html#24e54b27d4agt) \\| [API reference](https://www.alibabacloud.com/help/en/document_detail/2712576.html) \\| [Try online](https://modelstudio.console.alibabacloud.com/?tab=playground#/efm/prompt) ## International If you select the [International](https://www.alibabacloud.com/help/en/document_detail/3004398.html#080da663a75xh) deployment scope, model inference compute resources are dynamically scheduled worldwide, excluding the Chinese mainland. Static data is stored in your selected region. 
Supported region: Singapore.","tagline":"Qwen2.5 is a large language model series from Qwen."},{"id":"Qwen/Qwen2.5-7B-Instruct-1M","name":"Qwen2.5-7B-Instruct-1M","created_by":"qwen","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true,"reasoning":true,"structured_output":true,"batch":true,"json_mode":true},"model_type":"chat","parameters":7.6,"page_url":"https://huggingface.co/Qwen/Qwen2.5-7B-Instruct-1M","release_date":"2025-01-23","context_window":1010000,"license":"apache-2.0","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]},"description":"Qwen2.5 is part of the Qwen Large Language Model (LLM) series. We released a series of base language models and instruction-tuned language models with parameter scales ranging from 7 billion to 72 billion. Qwen2.5 improves upon Qwen2 in the following ways: * Pre-trained on our latest large-scale dataset containing up to 18 trillion tokens. * Significantly expanded knowledge and greatly enhanced coding and math capabilities due to our domain-expert models. * Major improvements in instruction following, long-text generation (over 8K tokens), structured data understanding (such as tables), and structured output generation (especially JSON). More resilient to diverse system prompts, enhancing chatbot role-playing and conditional setup. * Supports over 29 languages, including Chinese, English, French, Spanish, Portuguese, German, Italian, Russian, Japanese, Korean, Vietnamese, Thai, and Arabic. 
[Usage](https://www.alibabacloud.com/help/en/document_detail/2841718.html#24e54b27d4agt) \\| [API reference](https://www.alibabacloud.com/help/en/document_detail/2712576.html) \\| [Try online](https://modelstudio.console.alibabacloud.com/?tab=playground#/efm/prompt) ## International If you select the [International](https://www.alibabacloud.com/help/en/document_detail/3004398.html#080da663a75xh) deployment scope, model inference compute resources are dynamically scheduled worldwide, excluding the Chinese mainland. Static data is stored in your selected region. Supported region: Singapore.","tagline":"Qwen2.5 is a large language model series from Qwen."},{"id":"Qwen/Qwen2.5-7B-Instruct","name":"Qwen2.5-7B-Instruct","created_by":"qwen","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true,"reasoning":true,"structured_output":true,"batch":true,"json_mode":true},"model_type":"chat","parameters":7.6,"page_url":"https://huggingface.co/Qwen/Qwen2.5-7B-Instruct","release_date":"2024-09-16","context_window":32768,"license":"apache-2.0","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]},"description":"Qwen2.5 is part of the Qwen Large Language Model (LLM) series. We released a series of base language models and instruction-tuned language models with parameter scales ranging from 7 billion to 72 billion. Qwen2.5 improves upon Qwen2 in the following ways: * Pre-trained on our latest large-scale dataset containing up to 18 trillion tokens. * Significantly expanded knowledge and greatly enhanced coding and math capabilities due to our domain-expert models. * Major improvements in instruction following, long-text generation (over 8K tokens), structured data understanding (such as tables), and structured output generation (especially JSON). More resilient to diverse system prompts, enhancing chatbot role-playing and conditional setup. 
* Supports over 29 languages, including Chinese, English, French, Spanish, Portuguese, German, Italian, Russian, Japanese, Korean, Vietnamese, Thai, and Arabic. [Usage](https://www.alibabacloud.com/help/en/document_detail/2841718.html#24e54b27d4agt) \\| [API reference](https://www.alibabacloud.com/help/en/document_detail/2712576.html) \\| [Try online](https://modelstudio.console.alibabacloud.com/?tab=playground#/efm/prompt) ## International If you select the [International](https://www.alibabacloud.com/help/en/document_detail/3004398.html#080da663a75xh) deployment scope, model inference compute resources are dynamically scheduled worldwide, excluding the Chinese mainland. Static data is stored in your selected region. Supported region: Singapore.","tagline":"Qwen2.5 is a large language model series from Qwen."},{"id":"Qwen/Qwen2.5-Coder-0.5B-Instruct","name":"Qwen2.5-Coder-0.5B-Instruct","created_by":"qwen","source":"official","release_date":"2024-11-06","context_window":32768,"license":"apache-2.0","parameters":0.49,"page_url":"https://huggingface.co/Qwen/Qwen2.5-Coder-0.5B-Instruct","architecture":"transformer","model_type":"code","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-05-01"},{"id":"Qwen/Qwen2.5-Coder-0.5B","name":"Qwen2.5-Coder-0.5B","created_by":"qwen","source":"official","release_date":"2024-11-08","context_window":32768,"license":"apache-2.0","parameters":0.49,"page_url":"https://huggingface.co/Qwen/Qwen2.5-Coder-0.5B","architecture":"transformer","model_type":"code","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-05-01"},{"id":"Qwen/Qwen2.5-Coder-1.5B-Instruct","name":"Qwen2.5-Coder-1.5B-Instruct","created_by":"qwen","source":"official","last_updated":"2026-03-24","capabil
ities":{"streaming":true,"tool_call":true,"fine_tuning":true},"model_type":"code","parameters":1.5,"page_url":"https://huggingface.co/Qwen/Qwen2.5-Coder-1.5B-Instruct","release_date":"2024-09-18","context_window":32768,"license":"apache-2.0","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"Qwen/Qwen2.5-Coder-1.5B","name":"Qwen2.5-Coder-1.5B","created_by":"qwen","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"model_type":"code","parameters":1.5,"page_url":"https://huggingface.co/Qwen/Qwen2.5-Coder-1.5B","release_date":"2024-09-18","context_window":32768,"license":"apache-2.0","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"Qwen/Qwen2.5-Coder-14B-Instruct","name":"Qwen2.5-Coder-14B-Instruct","created_by":"qwen","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"model_type":"code","parameters":15,"page_url":"https://huggingface.co/Qwen/Qwen2.5-Coder-14B-Instruct","release_date":"2024-11-06","context_window":32768,"license":"apache-2.0","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"Qwen/Qwen2.5-Coder-14B","name":"Qwen2.5-Coder-14B","created_by":"qwen","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"model_type":"code","parameters":15,"page_url":"https://huggingface.co/Qwen/Qwen2.5-Coder-14B","release_date":"2024-11-08","context_window":32768,"license":"apache-2.0","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"Qwen/Qwen2.5-Coder-32B-Instruct","name":"Qwen2.5-Coder-32B-Instruct","created_by":"qwen","source":"official","las
t_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"model_type":"code","parameters":33,"page_url":"https://huggingface.co/Qwen/Qwen2.5-Coder-32B-Instruct","release_date":"2024-11-06","context_window":32768,"license":"apache-2.0","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"Qwen/Qwen2.5-Coder-32B","name":"Qwen2.5-Coder-32B","created_by":"qwen","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"model_type":"code","parameters":33,"page_url":"https://huggingface.co/Qwen/Qwen2.5-Coder-32B","release_date":"2024-11-08","context_window":32768,"license":"apache-2.0","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"Qwen/Qwen2.5-Coder-3B-Instruct","name":"Qwen2.5-Coder-3B-Instruct","created_by":"qwen","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"model_type":"code","parameters":3.1,"page_url":"https://huggingface.co/Qwen/Qwen2.5-Coder-3B-Instruct","release_date":"2024-11-06","context_window":32768,"license":"other","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"Qwen/Qwen2.5-Coder-3B","name":"Qwen2.5-Coder-3B","created_by":"qwen","source":"official","release_date":"2024-11-08","context_window":32768,"license":"other","parameters":3.1,"page_url":"https://huggingface.co/Qwen/Qwen2.5-Coder-3B","architecture":"transformer","model_type":"code","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-05-01"},{"id":"Qwen/Qwen2.5-Coder-7B-Instruct","name":"Qwen2.5-Coder-7B-Instruct","created_by":"qwen","source":"offi
cial","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"model_type":"code","parameters":7.6,"page_url":"https://huggingface.co/Qwen/Qwen2.5-Coder-7B-Instruct","release_date":"2024-09-17","context_window":32768,"license":"apache-2.0","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"Qwen/Qwen2.5-Coder-7B","name":"Qwen2.5-Coder-7B","created_by":"qwen","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"model_type":"code","parameters":7.6,"page_url":"https://huggingface.co/Qwen/Qwen2.5-Coder-7B","release_date":"2024-09-16","context_window":32768,"license":"apache-2.0","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"Qwen/Qwen2.5-Math-1.5B-Instruct","name":"Qwen2.5-Math-1.5B-Instruct","created_by":"qwen","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"model_type":"chat","parameters":1.5,"page_url":"https://huggingface.co/Qwen/Qwen2.5-Math-1.5B-Instruct","description":"> [!Warning] >
> > 🚨 Qwen2.5-Math mainly supports solving English and Chinese math problems through CoT and TIR. We do not recommend using this series of models for other tasks. > >
","release_date":"2024-09-16","context_window":4096,"license":"apache-2.0","tagline":"> [!Warning] >
> > 🚨 Qwen2.5-Math mainly supports solving English and Chinese math problems through CoT and TIR.","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"Qwen/Qwen2.5-Math-7B-Instruct","name":"Qwen2.5-Math-7B-Instruct","created_by":"qwen","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"model_type":"chat","parameters":7.6,"page_url":"https://huggingface.co/Qwen/Qwen2.5-Math-7B-Instruct","description":"> [!Warning] >
> > 🚨 Qwen2.5-Math mainly supports solving English and Chinese math problems through CoT and TIR. We do not recommend using this series of models for other tasks. > >
","release_date":"2024-09-19","context_window":4096,"license":"apache-2.0","tagline":"> [!Warning] >
> > 🚨 Qwen2.5-Math mainly supports solving English and Chinese math problems through CoT and TIR.","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"Qwen/Qwen3-0.6B-Base","name":"Qwen3-0.6B-Base","created_by":"qwen","source":"official","release_date":"2025-04-28","context_window":32768,"license":"apache-2.0","page_url":"https://huggingface.co/Qwen/Qwen3-0.6B-Base","architecture":"transformer","model_type":"chat","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-05-23","parameters":0.6},{"id":"Qwen/Qwen3-0.6B","name":"Qwen3-0.6B","created_by":"qwen","source":"official","release_date":"2025-04-27","context_window":40960,"license":"apache-2.0","parameters":0.75,"page_url":"https://huggingface.co/Qwen/Qwen3-0.6B","architecture":"transformer","model_type":"chat","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true,"reasoning":true,"structured_output":true,"batch":true,"json_mode":true},"open_weight":true,"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-05-01"},{"id":"Qwen/Qwen3-1.7B-Base","name":"Qwen3-1.7B-Base","created_by":"qwen","source":"official","release_date":"2025-04-28","context_window":32768,"license":"apache-2.0","parameters":1.7,"page_url":"https://huggingface.co/Qwen/Qwen3-1.7B-Base","architecture":"transformer","model_type":"chat","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-05-01"},{"id":"Qwen/Qwen3-1.7B","name":"Qwen3-1.7B","created_by":"qwen","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true,"reasoning":true,"structured_output":true,"batch":true,"json_mode":tru
e},"model_type":"chat","parameters":2,"page_url":"https://huggingface.co/Qwen/Qwen3-1.7B","release_date":"2025-04-27","context_window":40960,"license":"apache-2.0","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"Qwen/Qwen3-14B-Base","name":"Qwen3-14B-Base","created_by":"qwen","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"model_type":"chat","parameters":15,"page_url":"https://huggingface.co/Qwen/Qwen3-14B-Base","release_date":"2025-04-28","context_window":32768,"license":"apache-2.0","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"Qwen/Qwen3-14B","name":"Qwen3-14B","created_by":"qwen","source":"official","last_updated":"2026-05-23","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true,"reasoning":true,"structured_output":true,"batch":true,"json_mode":true},"model_type":"chat","parameters":15,"page_url":"https://huggingface.co/Qwen/Qwen3-14B","release_date":"2025-04-27","context_window":40960,"license":"apache-2.0","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"Qwen/Qwen3-235B-A22B-Instruct-2507","name":"Qwen3-235B-A22B-Instruct-2507","created_by":"qwen","source":"official","last_updated":"2026-05-23","alias":"Qwen/Qwen3-235B-A22B-Instruct","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true,"reasoning":true,"structured_output":true,"batch":true,"json_mode":true},"model_type":"chat","parameters":235,"active_parameters":15,"page_url":"https://huggingface.co/Qwen/Qwen3-235B-A22B-Instruct-2507","release_date":"2025-07-21","context_window":262144,"license":"apache-2.0","architecture":"moe","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"Qwen/Qwen3-235B-A2
2B-Instruct","name":"Qwen3-235B-A22B-Instruct-2507","created_by":"qwen","source":"official","last_updated":"2026-05-23","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true,"reasoning":true,"structured_output":true,"batch":true,"json_mode":true},"snapshots":["Qwen/Qwen3-235B-A22B-Instruct-2507"],"model_type":"chat","parameters":235,"active_parameters":15,"page_url":"https://huggingface.co/Qwen/Qwen3-235B-A22B-Instruct-2507","release_date":"2025-07-21","context_window":262144,"license":"apache-2.0","architecture":"moe","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"Qwen/Qwen3-235B-A22B-Thinking-2507","name":"Qwen3-235B-A22B-Thinking-2507","created_by":"qwen","source":"official","last_updated":"2026-05-23","alias":"Qwen/Qwen3-235B-A22B-Thinking","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true,"reasoning":true,"structured_output":true,"batch":true,"json_mode":true},"model_type":"chat","parameters":235,"active_parameters":15,"page_url":"https://huggingface.co/Qwen/Qwen3-235B-A22B-Thinking-2507","release_date":"2025-07-25","context_window":262144,"license":"apache-2.0","architecture":"moe","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"Qwen/Qwen3-235B-A22B-Thinking","name":"Qwen3-235B-A22B-Thinking-2507","created_by":"qwen","source":"official","last_updated":"2026-05-23","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true,"reasoning":true,"structured_output":true,"batch":true,"json_mode":true},"snapshots":["Qwen/Qwen3-235B-A22B-Thinking-2507"],"model_type":"chat","parameters":235,"active_parameters":15,"page_url":"https://huggingface.co/Qwen/Qwen3-235B-A22B-Thinking-2507","release_date":"2025-07-25","context_window":262144,"license":"apache-2.0","architecture":"moe","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"Qwen/Qwen3-235B-A22B","name":"Qw
en3-235B-A22B","created_by":"qwen","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true,"reasoning":true,"structured_output":true,"batch":true,"json_mode":true},"model_type":"chat","parameters":235,"active_parameters":15,"page_url":"https://huggingface.co/Qwen/Qwen3-235B-A22B","release_date":"2025-04-27","context_window":40960,"license":"apache-2.0","architecture":"moe","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"Qwen/Qwen3-30B-A3B-Instruct-2507","name":"Qwen3-30B-A3B-Instruct-2507","created_by":"qwen","source":"official","last_updated":"2026-05-23","alias":"Qwen/Qwen3-30B-A3B-Instruct","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true,"reasoning":true,"structured_output":true,"batch":true,"json_mode":true},"model_type":"chat","parameters":31,"active_parameters":1.9,"page_url":"https://huggingface.co/Qwen/Qwen3-30B-A3B-Instruct-2507","release_date":"2025-07-28","context_window":262144,"license":"apache-2.0","architecture":"moe","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"Qwen/Qwen3-30B-A3B-Instruct","name":"Qwen3-30B-A3B-Instruct-2507","created_by":"qwen","source":"official","last_updated":"2026-05-23","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true,"reasoning":true,"structured_output":true,"batch":true,"json_mode":true},"snapshots":["Qwen/Qwen3-30B-A3B-Instruct-2507"],"model_type":"chat","parameters":31,"active_parameters":1.9,"page_url":"https://huggingface.co/Qwen/Qwen3-30B-A3B-Instruct-2507","release_date":"2025-07-28","context_window":262144,"license":"apache-2.0","architecture":"moe","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"Qwen/Qwen3-30B-A3B-Thinking-2507","name":"Qwen3-30B-A3B-Thinking-2507","created_by":"qwen","source":"official","last_updated":"2026-03-24","release_dat
e":"2025-07-29","context_window":262144,"model_type":"chat","license":"apache-2.0","parameters":31,"active_parameters":1.9,"alias":"Qwen/Qwen3-30B-A3B-Thinking","page_url":"https://huggingface.co/Qwen/Qwen3-30B-A3B-Thinking-2507","architecture":"moe","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true,"reasoning":true,"structured_output":true,"batch":true,"json_mode":true},"modalities":{"input":["text"],"output":["text"]},"open_weight":true,"tools":["function_calling"]},{"id":"Qwen/Qwen3-30B-A3B-Thinking","name":"Qwen3-30B-A3B-Thinking-2507","created_by":"qwen","source":"official","last_updated":"2026-03-24","release_date":"2025-07-29","context_window":262144,"license":"apache-2.0","parameters":31,"active_parameters":1.9,"page_url":"https://huggingface.co/Qwen/Qwen3-30B-A3B-Thinking-2507","architecture":"moe","model_type":"chat","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true,"reasoning":true,"structured_output":true,"batch":true,"json_mode":true},"open_weight":true,"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"snapshots":["Qwen/Qwen3-30B-A3B-Thinking-2507"]},{"id":"Qwen/Qwen3-30B-A3B","name":"Qwen3-30B-A3B","created_by":"qwen","source":"official","last_updated":"2026-05-23","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true,"reasoning":true,"structured_output":true,"batch":true,"json_mode":true},"model_type":"chat","parameters":31,"active_parameters":1.9,"page_url":"https://huggingface.co/Qwen/Qwen3-30B-A3B","release_date":"2025-04-27","context_window":40960,"license":"apache-2.0","architecture":"moe","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"Qwen/Qwen3-32B","name":"Qwen3-32B","created_by":"qwen","source":"official","last_updated":"2026-05-23","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true,"reasoning":true,"structured_output":true,"batch":true,"json_mode":true},"model_type":"chat","parameters
":33,"page_url":"https://huggingface.co/Qwen/Qwen3-32B","release_date":"2025-04-27","context_window":40960,"license":"apache-2.0","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"Qwen/Qwen3-4B-Base","name":"Qwen3-4B-Base","created_by":"qwen","source":"official","release_date":"2025-04-28","context_window":32768,"license":"apache-2.0","parameters":4,"page_url":"https://huggingface.co/Qwen/Qwen3-4B-Base","architecture":"transformer","model_type":"chat","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-05-01"},{"id":"Qwen/Qwen3-4B-Instruct-2507","name":"Qwen3-4B-Instruct-2507","created_by":"qwen","source":"official","last_updated":"2026-03-24","alias":"Qwen/Qwen3-4B-Instruct","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"model_type":"chat","parameters":4,"page_url":"https://huggingface.co/Qwen/Qwen3-4B-Instruct-2507","release_date":"2025-08-05","context_window":262144,"license":"apache-2.0","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"Qwen/Qwen3-4B-Instruct","name":"Qwen3-4B-Instruct-2507","created_by":"qwen","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"snapshots":["Qwen/Qwen3-4B-Instruct-2507"],"model_type":"chat","parameters":4,"page_url":"https://huggingface.co/Qwen/Qwen3-4B-Instruct-2507","release_date":"2025-08-05","context_window":262144,"license":"apache-2.0","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"Qwen/Qwen3-4B-SafeRL","name":"Qwen3-4B-SafeRL","created_by":"qwen","source":"official","release_date":"2025-09-30","context_window":40960,"license":"apache-2.0","param
eters":4.4,"page_url":"https://huggingface.co/Qwen/Qwen3-4B-SafeRL","architecture":"transformer","model_type":"chat","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-05-01"},{"id":"Qwen/Qwen3-4B-Thinking-2507","name":"Qwen3-4B-Thinking-2507","created_by":"qwen","source":"official","last_updated":"2026-03-24","alias":"Qwen/Qwen3-4B-Thinking","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"model_type":"chat","parameters":4,"page_url":"https://huggingface.co/Qwen/Qwen3-4B-Thinking-2507","release_date":"2025-08-05","context_window":262144,"license":"apache-2.0","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"Qwen/Qwen3-4B-Thinking","name":"Qwen3-4B-Thinking-2507","created_by":"qwen","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"snapshots":["Qwen/Qwen3-4B-Thinking-2507"],"model_type":"chat","parameters":4,"page_url":"https://huggingface.co/Qwen/Qwen3-4B-Thinking-2507","release_date":"2025-08-05","context_window":262144,"license":"apache-2.0","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"Qwen/Qwen3-4B","name":"Qwen3-4B","created_by":"qwen","source":"official","release_date":"2025-04-27","context_window":40960,"license":"apache-2.0","page_url":"https://huggingface.co/Qwen/Qwen3-4B","architecture":"transformer","model_type":"chat","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true,"reasoning":true,"structured_output":true,"batch":true,"json_mode":true},"open_weight":true,"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-05-23","parameters":4},{"id":"Qwen/Qwen3-8B-Base","name":"Qwen3-8B-Base","created_by
":"qwen","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"model_type":"chat","parameters":8.2,"page_url":"https://huggingface.co/Qwen/Qwen3-8B-Base","release_date":"2025-04-28","context_window":32768,"license":"apache-2.0","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"Qwen/Qwen3-8B","name":"Qwen3-8B","created_by":"qwen","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true,"reasoning":true,"structured_output":true,"batch":true,"json_mode":true},"model_type":"chat","parameters":8.2,"page_url":"https://huggingface.co/Qwen/Qwen3-8B","release_date":"2025-04-27","context_window":40960,"license":"apache-2.0","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"Qwen/Qwen3-Coder-30B-A3B-Instruct","name":"Qwen3-Coder-30B-A3B-Instruct","created_by":"qwen","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true,"reasoning":true,"structured_output":true,"batch":true,"json_mode":true},"model_type":"code","parameters":31,"active_parameters":1.9,"page_url":"https://huggingface.co/Qwen/Qwen3-Coder-30B-A3B-Instruct","release_date":"2025-07-31","context_window":262144,"license":"apache-2.0","architecture":"moe","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8","name":"Qwen3-Coder-480B-A35B-Instruct-FP8","created_by":"qwen","source":"official","last_updated":"2026-05-23","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"model_type":"code","parameters":480,"active_parameters":24,"release_date":"2025-07-22","context_window":262144,"license":"apache-2.0","page_url":"https://huggingface.co/Qwen/Qwen3-Coder-480B-A35
B-Instruct-FP8","architecture":"moe","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"Qwen/Qwen3-Coder-480B-A35B-Instruct","name":"Qwen3-Coder-480B-A35B-Instruct","created_by":"qwen","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true,"reasoning":true,"structured_output":true,"batch":true,"json_mode":true},"model_type":"code","parameters":480,"active_parameters":24,"page_url":"https://huggingface.co/Qwen/Qwen3-Coder-480B-A35B-Instruct","release_date":"2025-07-22","context_window":262144,"license":"apache-2.0","architecture":"moe","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"Qwen/Qwen3-Coder-Next-FP8","name":"Qwen3-Coder-Next-FP8","created_by":"qwen","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"model_type":"code","page_url":"https://huggingface.co/Qwen/Qwen3-Coder-Next-FP8","release_date":"2026-02-01","context_window":262144,"license":"apache-2.0","parameters":80,"active_parameters":1.6,"architecture":"moe","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"Qwen/Qwen3-Coder-Next","name":"Qwen3-Coder-Next","created_by":"qwen","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true,"reasoning":true,"structured_output":true,"batch":true,"json_mode":true},"model_type":"code","release_date":"2026-01-30","context_window":262144,"license":"apache-2.0","parameters":80,"active_parameters":1.6,"page_url":"https://huggingface.co/Qwen/Qwen3-Coder-Next","architecture":"moe","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]},"description":"An open-source code model from Qwen. The latest Qwen3-Coder series delivers strong Coding Agent capabilities. 
It excels at tool calling and environment interaction. It supports autonomous programming and delivers outstanding coding performance while maintaining broad general-purpose abilities.[How to use](https://www.alibabacloud.com/help/en/document_detail/2850166.html) \\| [API reference](https://www.alibabacloud.com/help/en/document_detail/2712576.html) #### International If you select the [International](https://www.alibabacloud.com/help/en/document_detail/3004398.html#080da663a75xh) deployment scope, model inference compute resources are dynamically scheduled worldwide, excluding the Chinese mainland. Static data is stored in your selected region. Supported region: Singapore.","tagline":"The open-source Qwen code model.","max_output_tokens":65536},{"id":"Qwen/Qwen3-Next-80B-A3B-Instruct","name":"Qwen3-Next-80B-A3B-Instruct","created_by":"qwen","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true,"reasoning":true,"structured_output":true,"batch":true,"json_mode":true},"model_type":"chat","parameters":81,"active_parameters":1.6,"page_url":"https://huggingface.co/Qwen/Qwen3-Next-80B-A3B-Instruct","description":"Over the past few months, we have observed increasingly clear trends toward scaling both total parameters and context lengths in the pursuit of more powerful and agentic artificial intelligence (AI). We are excited to share our latest advancements in addressing these demands, centered on improving scaling efficiency through innovative model architecture. 
We call this next-generation foundation models **Qwen3-Next**.","release_date":"2025-09-09","context_window":262144,"license":"apache-2.0","tagline":"Over the past few months, we have observed increasingly clear trends toward scaling both total parameters and context lengths in the pursuit of more powerful and agentic artificial intelligence (AI).","architecture":"moe","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"Qwen/Qwen3-Next-80B-A3B-Thinking","name":"Qwen3-Next-80B-A3B-Thinking","created_by":"qwen","source":"official","last_updated":"2026-05-23","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true,"reasoning":true,"structured_output":true,"batch":true,"json_mode":true},"model_type":"chat","parameters":81,"active_parameters":1.6,"page_url":"https://huggingface.co/Qwen/Qwen3-Next-80B-A3B-Thinking","description":"Over the past few months, we have observed increasingly clear trends toward scaling both total parameters and context lengths in the pursuit of more powerful and agentic artificial intelligence (AI). We are excited to share our latest advancements in addressing these demands, centered on improving scaling efficiency through innovative model architecture. 
We call this next-generation foundation models **Qwen3-Next**.","release_date":"2025-09-09","context_window":262144,"license":"apache-2.0","tagline":"Over the past few months, we have observed increasingly clear trends toward scaling both total parameters and context lengths in the pursuit of more powerful and agentic artificial intelligence (AI).","architecture":"moe","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"Qwen/Qwen3Guard-Gen-0.6B","name":"Qwen3Guard-Gen-0.6B","created_by":"qwen","source":"official","description":"**Qwen3Guard** is a series of safety moderation models built upon Qwen3 and trained on a dataset of 1.19 million prompts and responses labeled for safety. The series includes models of three sizes (0.6B, 4B, and 8B) and features two specialized variants: **Qwen3Guard-Gen**, a generative model that frames safety classification as an instruction-following task, and **Qwen3Guard-Stream**, which incorporates a token-level classification head for real-time safety monitoring during incremental text ge…","release_date":"2025-09-23","context_window":32768,"license":"apache-2.0","parameters":0.75,"page_url":"https://huggingface.co/Qwen/Qwen3Guard-Gen-0.6B","architecture":"transformer","model_type":"chat","tagline":"**Qwen3Guard** is a series of safety moderation models built upon Qwen3 and trained on a dataset of 1.19 million prompts and responses labeled for safety.","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-05-01"},{"id":"Qwen/Qwen3Guard-Gen-4B","name":"Qwen3Guard-Gen-4B","created_by":"qwen","source":"official","description":"**Qwen3Guard** is a series of safety moderation models built upon Qwen3 and trained on a dataset of 1.19 million prompts and responses labeled for safety. 
The series includes models of three sizes (0.6B, 4B, and 8B) and features two specialized variants: **Qwen3Guard-Gen**, a generative model that frames safety classification as an instruction-following task, and **Qwen3Guard-Stream**, which incorporates a token-level classification head for real-time safety monitoring during incremental text ge…","release_date":"2025-09-23","context_window":32768,"license":"apache-2.0","parameters":4.4,"page_url":"https://huggingface.co/Qwen/Qwen3Guard-Gen-4B","architecture":"transformer","model_type":"chat","tagline":"**Qwen3Guard** is a series of safety moderation models built upon Qwen3 and trained on a dataset of 1.19 million prompts and responses labeled for safety.","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-05-17"},{"id":"Qwen/Qwen3Guard-Gen-8B","name":"Qwen3Guard-Gen-8B","created_by":"qwen","source":"official","description":"**Qwen3Guard** is a series of safety moderation models built upon Qwen3 and trained on a dataset of 1.19 million prompts and responses labeled for safety. 
The series includes models of three sizes (0.6B, 4B, and 8B) and features two specialized variants: **Qwen3Guard-Gen**, a generative model that frames safety classification as an instruction-following task, and **Qwen3Guard-Stream**, which incorporates a token-level classification head for real-time safety monitoring during incremental text ge…","release_date":"2025-09-23","context_window":32768,"license":"apache-2.0","parameters":8.2,"page_url":"https://huggingface.co/Qwen/Qwen3Guard-Gen-8B","architecture":"transformer","model_type":"chat","tagline":"**Qwen3Guard** is a series of safety moderation models built upon Qwen3 and trained on a dataset of 1.19 million prompts and responses labeled for safety.","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-05-01"},{"id":"RedHatAI/Meta-Llama-3-8B-Instruct-FP8-KV","name":"Meta-Llama-3-8B-Instruct-FP8-KV","created_by":"redhatai","source":"official","last_updated":"2026-03-23","capabilities":{"streaming":true,"tool_call":true},"family":"Llama-3","model_type":"chat","parameters":8,"page_url":"https://huggingface.co/RedHatAI/Meta-Llama-3-8B-Instruct-FP8-KV","release_date":"2024-05-20","context_window":8192,"architecture":"transformer","tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"RedHatAI/Qwen2-1.5B-Instruct-FP8","name":"Qwen2-1.5B-Instruct-FP8","created_by":"redhatai","source":"official","release_date":"2024-06-14","context_window":32768,"license":"apache-2.0","parameters":1.5,"page_url":"https://huggingface.co/RedHatAI/Qwen2-1.5B-Instruct-FP8","architecture":"transformer","model_type":"chat","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-05-29"},{"id":"RedHatAI/Qwen2-7B-Instruct-FP8","name":"Qwen2-7B-Instru
ct-FP8","created_by":"redhatai","source":"official","release_date":"2024-06-14","context_window":32768,"license":"apache-2.0","parameters":7.6,"page_url":"https://huggingface.co/RedHatAI/Qwen2-7B-Instruct-FP8","architecture":"transformer","model_type":"chat","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-04-14"},{"id":"ricdomolm/mini-coder-1.7b","name":"mini-coder-1.7b","created_by":"ricdomolm","source":"official","description":"`mini-coder-1.7b` is a 1.7B parameter model distilled from Qwen 3 Coder 30B A3B. It punches well above its weight, outperforming SWE-agent-LM 7B on [SWE-bench Verified Bash only](https://www.swebench.com/):","release_date":"2025-09-30","context_window":40960,"license":"mit","parameters":1.7,"page_url":"https://huggingface.co/ricdomolm/mini-coder-1.7b","architecture":"transformer","tagline":"`mini-coder-1.7b` is a 1.7B parameter model distilled from Qwen 3 Coder 30B A3B.","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"tools":["function_calling"],"last_updated":"2026-05-01"},{"id":"SakanaAI/TinySwallow-1.5B-Instruct","name":"TinySwallow-1.5B-Instruct","created_by":"sakanaai","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"parameters":1.5,"page_url":"https://huggingface.co/SakanaAI/TinySwallow-1.5B-Instruct","description":"🤗 [Models](https://huggingface.co/SakanaAI) | 📚 [Paper](https://arxiv.org/abs/2501.16937) | 📝 [Blog](https://sakana.ai/taid-jp/) | 🐦 [Twitter](https://twitter.com/SakanaAILabs)","release_date":"2025-01-07","context_window":32768,"license":"apache-2.0","tagline":"🤗 [Models](https://huggingface.co/SakanaAI) | 📚 [Paper](https://arxiv.org/abs/2501.16937) | 📝 [Blog](https://sakana.ai/taid-jp/) | 🐦 
[Twitter](https://twitter.com/SakanaAILabs)","architecture":"transformer","open_weight":true,"tools":["function_calling"]},{"id":"ShahriarFerdoush/llama-3.2-1b-code-instruct","name":"llama-3.2-1b-code-instruct","created_by":"shahriarferdoush","source":"official","family":"llama-3.2","description":"A lightweight yet powerful **code-focused language model** fine-tuned from **Meta Llama-3.2-1B** using **QLoRA (4-bit)** on the **CodeAlpaca-20K** dataset. Designed for **efficient code generation, reasoning, and problem-solving** on limited GPU resources.","release_date":"2025-12-24","context_window":131072,"license":"apache-2.0","parameters":1.2,"page_url":"https://huggingface.co/ShahriarFerdoush/llama-3.2-1b-code-instruct","architecture":"transformer","model_type":"chat","tagline":"A lightweight yet powerful **code-focused language model** fine-tuned from **Meta Llama-3.2-1B** using **QLoRA (4-bit)** on the **CodeAlpaca-20K** dataset.","capabilities":{"streaming":true,"fine_tuning":true},"open_weight":true,"modalities":{"input":["text"],"output":["text"]},"last_updated":"2026-05-07"},{"id":"speakleash/Bielik-7B-Instruct-v0.1","name":"Bielik-7B-Instruct-v0.1","created_by":"speakleash","source":"official","last_updated":"2026-03-21","capabilities":{"streaming":true},"parameters":7},{"id":"swap-uniba/LLaMAntino-3-ANITA-8B-Inst-DPO-ITA","name":"LLaMAntino-3-ANITA-8B-Inst-DPO-ITA","created_by":"swap-uniba","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"model_type":"chat","parameters":8,"page_url":"https://huggingface.co/swap-uniba/LLaMAntino-3-ANITA-8B-Inst-DPO-ITA","description":"📣 New MODEL FAMILY❗ [https://huggingface.co/m-polignano/ANITA-NEXT-24B-Magistral-2506-VISION-ITA](https://huggingface.co/m-polignano/ANITA-NEXT-24B-Magistral-2506-VISION-ITA)","release_date":"2024-04-29","context_window":8192,"license":"llama3","tagline":"📣 New MODEL FAMILY❗ 
[https://huggingface.co/m-polignano/ANITA-NEXT-24B-Magistral-2506-VISION-ITA](https://huggingface.co/m-polignano/ANITA-NEXT-24B-Magistral-2506-VISION-ITA)","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"swiss-ai/Apertus-70B-Instruct-2509","name":"Apertus-70B-Instruct-2509","created_by":"swiss-ai","source":"official","release_date":"2025-09-01","context_window":65536,"license":"apache-2.0","parameters":71,"alias":"swiss-ai/Apertus-70B-Instruct","page_url":"https://huggingface.co/swiss-ai/Apertus-70B-Instruct-2509","architecture":"transformer","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"tools":["function_calling"],"last_updated":"2026-06-10"},{"id":"swiss-ai/Apertus-70B-Instruct","name":"Apertus-70B-Instruct-2509","created_by":"swiss-ai","source":"official","release_date":"2025-09-01","context_window":65536,"license":"apache-2.0","parameters":71,"page_url":"https://huggingface.co/swiss-ai/Apertus-70B-Instruct-2509","architecture":"transformer","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"tools":["function_calling"],"snapshots":["swiss-ai/Apertus-70B-Instruct-2509"],"last_updated":"2026-06-10"},{"id":"swiss-ai/Apertus-8B-Instruct-2509","name":"Apertus-8B-Instruct-2509","created_by":"swiss-ai","source":"official","last_updated":"2026-04-21","alias":"swiss-ai/Apertus-8B-Instruct","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"parameters":8.1,"page_url":"https://huggingface.co/swiss-ai/Apertus-8B-Instruct-2509","release_date":"2025-08-13","context_window":65536,"license":"apache-2.0","architecture":"transformer","open_weight":true,"tools":["function_calling"]},{"id":"swiss-ai/Apertus-8B-Instruct","name":"Apertus-8B-Instruct-2509","created_by":"swiss-ai","source":"official","last_updated":"2026-04-21","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"sn
apshots":["swiss-ai/Apertus-8B-Instruct-2509"],"parameters":8.1,"page_url":"https://huggingface.co/swiss-ai/Apertus-8B-Instruct-2509","release_date":"2025-08-13","context_window":65536,"license":"apache-2.0","architecture":"transformer","open_weight":true,"tools":["function_calling"]},{"id":"TinyLlama/TinyLlama-1.1B-Chat-v1.0","name":"TinyLlama-1.1B-Chat-v1.0","created_by":"tinyllama","source":"official","release_date":"2023-12-30","context_window":2048,"license":"apache-2.0","parameters":1.1,"page_url":"https://huggingface.co/TinyLlama/TinyLlama-1.1B-Chat-v1.0","architecture":"transformer","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"tools":["function_calling"],"last_updated":"2026-05-01"},{"id":"tokyotech-llm/Llama-3-Swallow-8B-Instruct-v0.1","name":"Llama-3-Swallow-8B-Instruct-v0.1","created_by":"tokyotech-llm","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"family":"Llama-3","model_type":"chat","parameters":8,"page_url":"https://huggingface.co/tokyotech-llm/Llama-3-Swallow-8B-Instruct-v0.1","description":"Our Swallow model has undergone continual pre-training from the [Llama 3 family](https://huggingface.co/collections/meta-llama/meta-llama-3-66214712577ca38149ebb2b6), primarily with the addition of Japanese language data. The Instruct versions use supervised fine-tuning (SFT) and Chat Vector. 
Links to other models can be found in the index.","release_date":"2024-06-26","context_window":8192,"license":"llama3","tagline":"Our Swallow model has undergone continual pre-training from the [Llama 3 family](https://huggingface.co/collections/meta-llama/meta-llama-3-66214712577ca38149ebb2b6), primarily with the addition of Japanese language data.","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"tokyotech-llm/Llama-3.1-Swallow-8B-Instruct-v0.5","name":"Llama-3.1-Swallow-8B-Instruct-v0.5","created_by":"tokyotech-llm","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"family":"Llama-3.1","model_type":"chat","parameters":8,"page_url":"https://huggingface.co/tokyotech-llm/Llama-3.1-Swallow-8B-Instruct-v0.5","description":"Llama 3.1 Swallow is a series of large language models (8B, 70B) that were built by continual pre-training on the [Meta Llama 3.1](https://huggingface.co/collections/meta-llama/llama-31-669fc079a0c406a149a5738f) models. 
Llama 3.1 Swallow enhanced the Japanese language capabilities of the original Llama 3.1 while retaining the English language capabilities.","release_date":"2025-06-12","context_window":131072,"license":"llama3.3","tagline":"Llama 3.1 Swallow is a series of large language models (8B, 70B) that were built by continual pre-training on the [Meta Llama 3.1](https://huggingface.co/collections/meta-llama/llama-31-669fc079a0c406a149a5738f) models.","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"unsloth/gemma-2-9b-it","name":"gemma-2-9b-it","created_by":"unsloth","source":"official","last_updated":"2026-03-27","family":"gemma-2","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"model_type":"chat","parameters":9.2,"page_url":"https://huggingface.co/unsloth/gemma-2-9b-it","release_date":"2024-07-03","context_window":8192,"license":"gemma","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"unsloth/gemma-3-1b-it","name":"gemma-3-1b-it","created_by":"unsloth","source":"official","family":"gemma-3","description":"- Fine-tune Gemma 3 (12B) for free using our Google [Colab notebook here](https://docs.unsloth.ai/get-started/unsloth-notebooks)! - Read our Blog about Gemma 3 support: [unsloth.ai/blog/gemma3](https://unsloth.ai/blog/gemma3) - View the rest of our notebooks in our [docs here](https://docs.unsloth.ai/get-started/unsloth-notebooks). - Export your fine-tuned model to GGUF, Ollama, llama.cpp or 🤗HF.","release_date":"2025-03-12","context_window":32768,"license":"gemma","parameters":1,"page_url":"https://huggingface.co/unsloth/gemma-3-1b-it","architecture":"transformer","model_type":"chat","tagline":"- Fine-tune Gemma 3 (12B) for free using our Google [Colab notebook here](https://docs.unsloth.ai/get-started/unsloth-notebooks)! 
- Read our Blog about Gemma 3 support: [unsloth.ai/blog/gemma3](https://unsloth.ai/blog/gemma3) - View the rest of our notebooks in our [docs here](https://docs.unsloth.ai/get-started/unsloth-notebooks).","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-05-01"},{"id":"unsloth/llama-3-8b-Instruct","name":"llama-3-8b-Instruct","created_by":"unsloth","source":"official","last_updated":"2026-03-24","family":"llama-3","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"model_type":"chat","parameters":8,"page_url":"https://huggingface.co/unsloth/llama-3-8b-Instruct","description":"Directly quantized 4bit model with `bitsandbytes`.","release_date":"2024-04-18","context_window":8192,"license":"llama3","tagline":"Directly quantized 4bit model with `bitsandbytes`.","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"unsloth/Llama-3.1-8B-Instruct","name":"Llama-3.1-8B-Instruct","created_by":"unsloth","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"family":"Llama-3.1","model_type":"chat","parameters":8,"page_url":"https://huggingface.co/unsloth/Llama-3.1-8B-Instruct","release_date":"2025-02-15","context_window":131072,"license":"llama3.1","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"unsloth/Llama-3.2-1B-Instruct","name":"Llama-3.2-1B-Instruct","created_by":"unsloth","source":"official","family":"Llama-3.2","release_date":"2024-09-25","context_window":131072,"license":"llama3.2","parameters":1.2,"page_url":"https://huggingface.co/unsloth/Llama-3.2-1B-Instruct","architecture":"transformer","model_type":"chat","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_
weight":true,"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-05-01"},{"id":"unsloth/Llama-3.2-3B-Instruct","name":"Llama-3.2-3B-Instruct","created_by":"unsloth","source":"official","family":"Llama-3.2","release_date":"2024-09-25","context_window":131072,"license":"llama3.2","parameters":3.2,"page_url":"https://huggingface.co/unsloth/Llama-3.2-3B-Instruct","architecture":"transformer","model_type":"chat","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-05-01"},{"id":"unsloth/Llama-3.3-70B-Instruct","name":"Llama-3.3-70B-Instruct","created_by":"unsloth","source":"official","family":"Llama-3.3","release_date":"2024-12-06","context_window":131072,"license":"llama3.3","parameters":71,"page_url":"https://huggingface.co/unsloth/Llama-3.3-70B-Instruct","architecture":"transformer","model_type":"chat","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-05-06"},{"id":"unsloth/Meta-Llama-3.1-8B-Instruct","name":"Meta-Llama-3.1-8B-Instruct","created_by":"unsloth","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"family":"Llama-3.1","model_type":"chat","parameters":8,"page_url":"https://huggingface.co/unsloth/Meta-Llama-3.1-8B-Instruct","description":"We have a free Google Colab Tesla T4 notebook for Llama 3.1 (8B) here: https://colab.research.google.com/drive/1Ys44kVvmeZtnICzWz0xgpRnrIOjZAuxp?usp=sharing","release_date":"2024-07-23","context_window":131072,"license":"llama3.1","tagline":"We have a free Google Colab Tesla T4 notebook for Llama 3.1 (8B) here: 
https://colab.research.google.com/drive/1Ys44kVvmeZtnICzWz0xgpRnrIOjZAuxp?usp=sharing","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"unsloth/Mistral-Small-24B-Instruct-2501","name":"Mistral-Small-24B-Instruct-2501","created_by":"unsloth","source":"official","last_updated":"2026-03-24","alias":"unsloth/Mistral-Small-24B-Instruct","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"model_type":"chat","parameters":24,"page_url":"https://huggingface.co/unsloth/Mistral-Small-24B-Instruct-2501","description":"We have a free Google Colab Tesla T4 notebook for Mistral (7B) here: https://colab.research.google.com/github/unslothai/notebooks/blob/main/nb/Mistral_v0.3_(7B)-Conversational.ipynb","release_date":"2025-01-30","context_window":32768,"license":"apache-2.0","tagline":"We have a free Google Colab Tesla T4 notebook for Mistral (7B) here: https://colab.research.google.com/github/unslothai/notebooks/blob/main/nb/Mistral_v0.3_(7B)-Conversational.ipynb","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"unsloth/Mistral-Small-24B-Instruct","name":"Mistral-Small-24B-Instruct-2501","created_by":"unsloth","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"snapshots":["unsloth/Mistral-Small-24B-Instruct-2501"],"model_type":"chat","parameters":24,"page_url":"https://huggingface.co/unsloth/Mistral-Small-24B-Instruct-2501","description":"We have a free Google Colab Tesla T4 notebook for Mistral (7B) here: https://colab.research.google.com/github/unslothai/notebooks/blob/main/nb/Mistral_v0.3_(7B)-Conversational.ipynb","release_date":"2025-01-30","context_window":32768,"license":"apache-2.0","tagline":"We have a free Google Colab Tesla T4 notebook for Mistral (7B) here: 
https://colab.research.google.com/github/unslothai/notebooks/blob/main/nb/Mistral_v0.3_(7B)-Conversational.ipynb","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"unsloth/Qwen2.5-0.5B-Instruct","name":"Qwen2.5-0.5B-Instruct","created_by":"unsloth","source":"official","description":"We have a Qwen 2.5 (all model sizes) [free Google Colab Tesla T4 notebook](https://colab.research.google.com/drive/1Kose-ucXO1IBaZq5BvbwWieuubP7hxvQ?usp=sharing). Also a [Qwen 2.5 conversational style notebook](https://colab.research.google.com/drive/1qN1CEalC70EO1wGKhNxs1go1W9So61R5?usp=sharing).","release_date":"2024-09-18","context_window":32768,"license":"apache-2.0","parameters":0.49,"page_url":"https://huggingface.co/unsloth/Qwen2.5-0.5B-Instruct","architecture":"transformer","model_type":"chat","tagline":"We have a Qwen 2.5 (all model sizes) [free Google Colab Tesla T4 notebook](https://colab.research.google.com/drive/1Kose-ucXO1IBaZq5BvbwWieuubP7hxvQ?usp=sharing).","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-05-01"},{"id":"unsloth/Qwen2.5-1.5B-Instruct","name":"Qwen2.5-1.5B-Instruct","created_by":"unsloth","source":"official","description":"We have a Qwen 2.5 (all model sizes) [free Google Colab Tesla T4 notebook](https://colab.research.google.com/drive/1Kose-ucXO1IBaZq5BvbwWieuubP7hxvQ?usp=sharing). 
Also a [Qwen 2.5 conversational style notebook](https://colab.research.google.com/drive/1qN1CEalC70EO1wGKhNxs1go1W9So61R5?usp=sharing).","release_date":"2024-09-18","context_window":32768,"license":"apache-2.0","parameters":1.5,"page_url":"https://huggingface.co/unsloth/Qwen2.5-1.5B-Instruct","architecture":"transformer","model_type":"chat","tagline":"We have a Qwen 2.5 (all model sizes) [free Google Colab Tesla T4 notebook](https://colab.research.google.com/drive/1Kose-ucXO1IBaZq5BvbwWieuubP7hxvQ?usp=sharing).","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-05-01"},{"id":"unsloth/Qwen2.5-14B-Instruct","name":"Qwen2.5-14B-Instruct","created_by":"unsloth","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"model_type":"chat","parameters":15,"page_url":"https://huggingface.co/unsloth/Qwen2.5-14B-Instruct","description":"We have a Qwen 2.5 (all model sizes) [free Google Colab Tesla T4 notebook](https://colab.research.google.com/drive/1Kose-ucXO1IBaZq5BvbwWieuubP7hxvQ?usp=sharing). 
Also a [Qwen 2.5 conversational style notebook](https://colab.research.google.com/drive/1qN1CEalC70EO1wGKhNxs1go1W9So61R5?usp=sharing).","release_date":"2024-09-23","context_window":32768,"license":"apache-2.0","tagline":"We have a Qwen 2.5 (all model sizes) [free Google Colab Tesla T4 notebook](https://colab.research.google.com/drive/1Kose-ucXO1IBaZq5BvbwWieuubP7hxvQ?usp=sharing).","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"unsloth/Qwen2.5-32B-Instruct","name":"Qwen2.5-32B-Instruct","created_by":"unsloth","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"model_type":"chat","parameters":33,"page_url":"https://huggingface.co/unsloth/Qwen2.5-32B-Instruct","description":"We have a Qwen 2.5 (all model sizes) [free Google Colab Tesla T4 notebook](https://colab.research.google.com/drive/1Kose-ucXO1IBaZq5BvbwWieuubP7hxvQ?usp=sharing). Also a [Qwen 2.5 conversational style notebook](https://colab.research.google.com/drive/1qN1CEalC70EO1wGKhNxs1go1W9So61R5?usp=sharing).","release_date":"2024-09-23","context_window":32768,"license":"apache-2.0","tagline":"We have a Qwen 2.5 (all model sizes) [free Google Colab Tesla T4 notebook](https://colab.research.google.com/drive/1Kose-ucXO1IBaZq5BvbwWieuubP7hxvQ?usp=sharing).","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"unsloth/Qwen2.5-3B-Instruct","name":"Qwen2.5-3B-Instruct","created_by":"unsloth","source":"official","description":"We have a Qwen 2.5 (all model sizes) [free Google Colab Tesla T4 notebook](https://colab.research.google.com/drive/1Kose-ucXO1IBaZq5BvbwWieuubP7hxvQ?usp=sharing). 
Also a [Qwen 2.5 conversational style notebook](https://colab.research.google.com/drive/1qN1CEalC70EO1wGKhNxs1go1W9So61R5?usp=sharing).","release_date":"2024-09-18","context_window":32768,"license":"other","parameters":3.1,"page_url":"https://huggingface.co/unsloth/Qwen2.5-3B-Instruct","architecture":"transformer","model_type":"chat","tagline":"We have a Qwen 2.5 (all model sizes) [free Google Colab Tesla T4 notebook](https://colab.research.google.com/drive/1Kose-ucXO1IBaZq5BvbwWieuubP7hxvQ?usp=sharing).","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-05-01"},{"id":"unsloth/Qwen2.5-7B-Instruct","name":"Qwen2.5-7B-Instruct","created_by":"unsloth","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"model_type":"chat","parameters":7.6,"page_url":"https://huggingface.co/unsloth/Qwen2.5-7B-Instruct","description":"We have a Qwen 2.5 (all model sizes) [free Google Colab Tesla T4 notebook](https://colab.research.google.com/drive/1Kose-ucXO1IBaZq5BvbwWieuubP7hxvQ?usp=sharing). 
Also a [Qwen 2.5 conversational style notebook](https://colab.research.google.com/drive/1qN1CEalC70EO1wGKhNxs1go1W9So61R5?usp=sharing).","release_date":"2024-09-18","context_window":32768,"license":"apache-2.0","tagline":"We have a Qwen 2.5 (all model sizes) [free Google Colab Tesla T4 notebook](https://colab.research.google.com/drive/1Kose-ucXO1IBaZq5BvbwWieuubP7hxvQ?usp=sharing).","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"unsloth/Qwen2.5-Coder-32B-Instruct","name":"Qwen2.5-Coder-32B-Instruct","created_by":"unsloth","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"model_type":"code","parameters":33,"page_url":"https://huggingface.co/unsloth/Qwen2.5-Coder-32B-Instruct","description":"We have a Qwen 2.5 (all model sizes) [free Google Colab Tesla T4 notebook](https://colab.research.google.com/drive/1Kose-ucXO1IBaZq5BvbwWieuubP7hxvQ?usp=sharing). Also a [Qwen 2.5 conversational style notebook](https://colab.research.google.com/drive/1qN1CEalC70EO1wGKhNxs1go1W9So61R5?usp=sharing).","release_date":"2024-11-12","context_window":32768,"license":"apache-2.0","tagline":"We have a Qwen 2.5 (all model sizes) [free Google Colab Tesla T4 notebook](https://colab.research.google.com/drive/1Kose-ucXO1IBaZq5BvbwWieuubP7hxvQ?usp=sharing).","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"unsloth/Qwen2.5-Coder-7B-Instruct","name":"Qwen2.5-Coder-7B-Instruct","created_by":"unsloth","source":"official","description":"We have a Qwen 2.5 (all model sizes) [free Google Colab Tesla T4 notebook](https://colab.research.google.com/drive/1Kose-ucXO1IBaZq5BvbwWieuubP7hxvQ?usp=sharing). 
Also a [Qwen 2.5 conversational style notebook](https://colab.research.google.com/drive/1qN1CEalC70EO1wGKhNxs1go1W9So61R5?usp=sharing).","release_date":"2024-09-23","context_window":32768,"license":"apache-2.0","parameters":7.6,"page_url":"https://huggingface.co/unsloth/Qwen2.5-Coder-7B-Instruct","architecture":"transformer","model_type":"code","tagline":"We have a Qwen 2.5 (all model sizes) [free Google Colab Tesla T4 notebook](https://colab.research.google.com/drive/1Kose-ucXO1IBaZq5BvbwWieuubP7hxvQ?usp=sharing).","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-04-16"},{"id":"unsloth/Qwen3-1.7B-Base","name":"Qwen3-1.7B-Base","created_by":"unsloth","source":"official","release_date":"2025-04-28","context_window":32768,"license":"apache-2.0","page_url":"https://huggingface.co/unsloth/Qwen3-1.7B-Base","architecture":"transformer","model_type":"chat","capabilities":{"streaming":true,"fine_tuning":true},"open_weight":true,"modalities":{"input":["text"],"output":["text"]},"last_updated":"2026-05-17"},{"id":"unsloth/Qwen3-4B-Base","name":"Qwen3-4B-Base","created_by":"unsloth","source":"official","release_date":"2025-04-28","context_window":32768,"license":"apache-2.0","page_url":"https://huggingface.co/unsloth/Qwen3-4B-Base","architecture":"transformer","model_type":"chat","capabilities":{"streaming":true,"fine_tuning":true},"open_weight":true,"modalities":{"input":["text"],"output":["text"]},"last_updated":"2026-06-02"},{"id":"unsloth/Qwen3-4B-Instruct-2507","name":"Qwen3-4B-Instruct-2507","created_by":"unsloth","source":"official","release_date":"2025-08-06","context_window":262144,"model_type":"chat","license":"apache-2.0","alias":"unsloth/Qwen3-4B-Instruct","page_url":"https://huggingface.co/unsloth/Qwen3-4B-Instruct-2507","architecture":"transformer","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"modalit
ies":{"input":["text"],"output":["text"]},"open_weight":true,"tools":["function_calling"],"last_updated":"2026-05-01"},{"id":"unsloth/Qwen3-4B-Instruct","name":"Qwen3-4B-Instruct-2507","created_by":"unsloth","source":"official","release_date":"2025-08-06","context_window":262144,"license":"apache-2.0","page_url":"https://huggingface.co/unsloth/Qwen3-4B-Instruct-2507","architecture":"transformer","model_type":"chat","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"snapshots":["unsloth/Qwen3-4B-Instruct-2507"],"last_updated":"2026-05-01"},{"id":"unsloth/Qwen3-8B-Base","name":"Qwen3-8B-Base","created_by":"unsloth","source":"official","release_date":"2025-04-28","context_window":32768,"license":"apache-2.0","page_url":"https://huggingface.co/unsloth/Qwen3-8B-Base","architecture":"transformer","model_type":"chat","capabilities":{"streaming":true,"fine_tuning":true},"open_weight":true,"modalities":{"input":["text"],"output":["text"]},"last_updated":"2026-03-26"},{"id":"unsloth/Qwen3-8B","name":"Qwen3-8B","created_by":"unsloth","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"model_type":"chat","parameters":8,"page_url":"https://huggingface.co/unsloth/Qwen3-8B","release_date":"2025-04-28","context_window":40960,"license":"apache-2.0","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"unsloth/tinyllama-chat","name":"tinyllama-chat","created_by":"unsloth","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"page_url":"https://huggingface.co/unsloth/tinyllama-chat","description":"[](https://discord.gg/u54VK8m8tk) [](https://ko-fi.com/unsloth) 
[](https://github.com/unslothai/unsloth)","release_date":"2024-02-14","context_window":2048,"license":"apache-2.0","parameters":1.1,"tagline":"[](https://discord.gg/u54VK8m8tk) [Discord community.","release_date":"2025-07-20","context_window":131072,"license":"mit","tagline":"👋 Join our Discord community.","architecture":"moe","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"zai-org/GLM-4.5-Air","name":"GLM-4.5-Air","created_by":"zhipu","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"family":"GLM-4.5","model_type":"chat","page_url":"https://huggingface.co/zai-org/GLM-4.5-Air","description":"👋 Join our Discord community.","release_date":"2025-07-20","context_window":131072,"license":"mit","parameters":110,"tagline":"👋 Join our Discord community.","architecture":"moe","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"zai-org/GLM-4.5","name":"GLM-4.5","created_by":"zhipu","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"family":"GLM-4.5","model_type":"chat","page_url":"https://huggingface.co/zai-org/GLM-4.5","description":"👋 Join our Discord community.","release_date":"2025-07-20","context_window":131072,"license":"mit","parameters":358,"tagline":"👋 Join our Discord community.","architecture":"moe","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"zai-org/GLM-4.6-FP8","name":"GLM-4.6-FP8","created_by":"zhipu","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"family":"GLM-4.6","model_type":"chat","page_url":"https://huggingface.co/zai-org/GLM-4.6-FP8","description":"👋 Join our Discord community.","release_date":"2025-09-29","context_window":202752,"license":"mit","tagline":"👋 Join our Discord 
community.","architecture":"moe","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"zai-org/GLM-4.6","name":"GLM-4.6","created_by":"zhipu","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"family":"GLM-4.6","model_type":"chat","page_url":"https://huggingface.co/zai-org/GLM-4.6","description":"👋 Join our Discord community.","release_date":"2025-09-29","context_window":202752,"license":"mit","parameters":357,"tagline":"👋 Join our Discord community.","architecture":"moe","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"zai-org/GLM-4.7-Flash","name":"GLM-4.7-Flash","created_by":"zhipu","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"family":"GLM-4.7","model_type":"chat","page_url":"https://huggingface.co/zai-org/GLM-4.7-Flash","description":"👋 Join our Discord community.","release_date":"2026-01-19","context_window":202752,"license":"mit","parameters":31,"tagline":"👋 Join our Discord community.","architecture":"moe","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"zai-org/GLM-4.7-FP8","name":"GLM-4.7-FP8","created_by":"zhipu","source":"official","last_updated":"2026-05-29","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"family":"GLM-4.7","model_type":"chat","page_url":"https://huggingface.co/zai-org/GLM-4.7-FP8","description":"👋 Join our Discord community.","release_date":"2025-12-22","context_window":202752,"license":"mit","tagline":"👋 Join our Discord 
community.","architecture":"moe","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]},"parameters":358},{"id":"zai-org/GLM-4.7","name":"GLM-4.7","created_by":"zhipu","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"family":"GLM-4.7","model_type":"chat","page_url":"https://huggingface.co/zai-org/GLM-4.7","description":"👋 Join our Discord community.","release_date":"2025-12-22","context_window":202752,"license":"mit","parameters":358,"tagline":"👋 Join our Discord community.","architecture":"moe","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"zai-org/GLM-5.1-FP8","name":"GLM-5.1-FP8","created_by":"zhipu","source":"official","family":"GLM-5.1","release_date":"2026-04-03","context_window":202752,"license":"mit","parameters":754,"page_url":"https://huggingface.co/zai-org/GLM-5.1-FP8","architecture":"moe","model_type":"chat","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-04-10"},{"id":"zai-org/GLM-5.1","name":"GLM-5.1","created_by":"zhipu","source":"official","family":"GLM-5.1","release_date":"2026-04-03","context_window":202752,"license":"mit","parameters":754,"page_url":"https://huggingface.co/zai-org/GLM-5.1","architecture":"moe","model_type":"chat","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-04-12"},{"id":"zai-org/GLM-5.2-FP8","name":"GLM-5.2-FP8","created_by":"zhipu","source":"official","family":"GLM-5.2","release_date":"2026-06-16","context_window":1048576,"license":"mit","parameters":753,"page_url":"https://huggingface.co/zai-org/GLM-5.2-FP8","architecture":"moe","model_type":"chat","capabilities":{"streaming":tru
e,"tool_call":true,"fine_tuning":true},"open_weight":true,"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-06-20"},{"id":"zai-org/GLM-5.2","name":"GLM-5.2","created_by":"zhipu","source":"official","family":"GLM-5.2","release_date":"2026-06-16","context_window":1048576,"license":"mit","parameters":753,"page_url":"https://huggingface.co/zai-org/GLM-5.2","architecture":"moe","model_type":"chat","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-06-29"},{"id":"zai-org/GLM-5","name":"GLM-5","created_by":"zhipu","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"family":"GLM-5","model_type":"chat","page_url":"https://huggingface.co/zai-org/GLM-5","description":"👋 Join our WeChat or Discord community.","release_date":"2026-02-11","context_window":202752,"license":"mit","parameters":754,"tagline":"👋 Join our WeChat or Discord","architecture":"moe","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"zai-org/GLM-Z1-32B-0414","name":"GLM-Z1-32B-0414","created_by":"zhipu","source":"official","last_updated":"2026-03-21","capabilities":{"streaming":true},"model_type":"chat","family":"glm","parameters":32}]}; +export const provider: ProviderWithModels = {"id":"huggingface","name":"Hugging Face","region":"US","headquarters":"New York, NY","founded":2016,"url":"https://huggingface.co","api_url":"https://router.huggingface.co/v1","docs_url":"https://huggingface.co/docs/api-inference","pricing_url":"https://huggingface.co/pricing","description":"The AI community platform hosting open-source models with serverless inference 
endpoints.","type":"aggregator","sdk":{"python":"huggingface_hub","javascript":"@huggingface/inference"},"openai_compatible":true,"free_tier":true,"github_url":"https://github.com/huggingface","models_url":"https://huggingface.co/models","twitter_url":"https://x.com/huggingface","discord_url":"https://discord.com/invite/hugging-face-879548962464493619","blog_url":"https://huggingface.co/blog","terms_url":"https://huggingface.co/terms-of-service","support_url":"https://huggingface.co/support","icon":"\n \n","models":[{"id":"0xgr3y/Qwen2.5-Coder-0.5B-Instruct-Gensyn-Swarm-tall_tame_panther","name":"Qwen2.5-Coder-0.5B-Instruct-Gensyn-Swarm-tall_tame_panther","created_by":"0xgr3y","source":"official","release_date":"2025-11-13","context_window":32768,"license":"mit","parameters":0.49,"page_url":"https://huggingface.co/0xgr3y/Qwen2.5-Coder-0.5B-Instruct-Gensyn-Swarm-tall_tame_panther","architecture":"transformer","model_type":"code","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-05-01"},{"id":"aaditya/Llama3-OpenBioLLM-8B","name":"Llama3-OpenBioLLM-8B","created_by":"aaditya","source":"official","last_updated":"2026-03-24","page_url":"https://huggingface.co/aaditya/Llama3-OpenBioLLM-8B","model_type":"chat","capabilities":{"streaming":true,"fine_tuning":true},"description":"Introducing OpenBioLLM-8B: A State-of-the-Art Open Source Biomedical Large Language Model","release_date":"2024-04-20","context_window":8192,"license":"llama3","tagline":"Introducing OpenBioLLM-8B: A State-of-the-Art Open Source Biomedical Large Language 
Model","architecture":"transformer","open_weight":true,"modalities":{"input":["text"],"output":["text"]}},{"id":"allenai/Olmo-3-7B-Instruct","name":"Olmo-3-7B-Instruct","created_by":"allenai","source":"official","last_updated":"2026-06-29","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"parameters":7.3,"page_url":"https://huggingface.co/allenai/Olmo-3-7B-Instruct","release_date":"2025-11-19","context_window":65536,"license":"apache-2.0","architecture":"transformer","open_weight":true,"tools":["function_calling"]},{"id":"allenai/Olmo-3.1-32B-Instruct","name":"Olmo-3.1-32B-Instruct","created_by":"allenai","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"parameters":32,"page_url":"https://huggingface.co/allenai/Olmo-3.1-32B-Instruct","release_date":"2025-12-10","context_window":65536,"license":"apache-2.0","architecture":"transformer","open_weight":true,"tools":["function_calling"]},{"id":"alpindale/Llama-3.2-1B-Instruct","name":"Llama-3.2-1B-Instruct","created_by":"alpindale","source":"official","family":"Llama-3.2","release_date":"2024-09-25","context_window":131072,"license":"llama3.2","parameters":1.2,"page_url":"https://huggingface.co/alpindale/Llama-3.2-1B-Instruct","architecture":"transformer","model_type":"chat","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-04-01"},{"id":"anthracite-org/magnum-v4-72b","name":"magnum-v4-72b","created_by":"anthracite-org","source":"official","description":"This is a series of models designed to replicate the prose quality of the Claude 3 models, specifically Sonnet and Opus.","release_date":"2024-09-20","context_window":32768,"license":"apache-2.0","parameters":73,"page_url":"https://huggingface.co/anthracite-org/magnum-v4-72b","architecture":"transformer","tagline":"This is a series of models 
designed to replicate the prose quality of the Claude 3 models, specifically Sonnet and Opus.","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"tools":["function_calling"],"last_updated":"2026-05-01"},{"id":"arcee-ai/Trinity-Large-Thinking","name":"Trinity-Large-Thinking","created_by":"arcee-ai","source":"official","description":"src=\"https://cdn-uploads.huggingface.co/production/uploads/6435718aaaef013d1aec3b8b/i-v1KyAMOW_mgVGeic9WJ.png\" alt=\"Arcee Trinity Large Thinking\" style=\"max-width: 100%; height: auto;\" >","release_date":"2026-04-01","context_window":262144,"license":"apache-2.0","parameters":399,"active_parameters":6.2,"page_url":"https://huggingface.co/arcee-ai/Trinity-Large-Thinking","architecture":"moe","tagline":"src=\"https://cdn-uploads.huggingface.co/production/uploads/6435718aaaef013d1aec3b8b/i-v1KyAMOW_mgVGeic9WJ.png\" alt=\"Arcee Trinity Large Thinking\" style=\"max-width: 100%; height: auto;\" >","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"tools":["function_calling"],"last_updated":"2026-04-10"},{"id":"argilla/Llama-3.2-1B-Instruct-APIGen-FC-v0.1","name":"Llama-3.2-1B-Instruct-APIGen-FC-v0.1","created_by":"argilla","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"family":"Llama-3.2","model_type":"chat","parameters":1,"page_url":"https://huggingface.co/argilla/Llama-3.2-1B-Instruct-APIGen-FC-v0.1","description":"This model is a fine-tuned version of [meta-llama/Llama-3.2-1B-Instruct](https://huggingface.co/meta-llama/Llama-3.2-1B-Instruct) on [argilla-warehouse/apigen-synth-trl](https://huggingface.co/datasets/argilla-warehouse/apigen-synth-trl) dataset, a version of [argilla/Synth-APIGen-v0.1](https://huggingface.co/datasets/argilla-warehouse/Synth-APIGen-v0.1) ready to do SFT on top of it. 
It has been trained using [TRL](https://github.com/huggingface/trl).","release_date":"2024-10-07","context_window":131072,"license":"apache-2.0","tagline":"This model is a fine-tuned version of [meta-llama/Llama-3.2-1B-Instruct](https://huggingface.co/meta-llama/Llama-3.2-1B-Instruct) on [argilla-warehouse/apigen-synth-trl](https://huggingface.co/datasets/argilla-warehouse/apigen-synth-trl) dataset, a version of [argilla/Synth-APIGen-v0.1](https://huggingface.co/datasets/argilla-warehouse/Synth-APIGen-v0.1) ready to do SFT on top of it.","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"argilla-warehouse/Llama-3.2-1B-Instruct-v2-FC","name":"Llama-3.2-1B-Instruct-v2-FC","created_by":"argilla-warehouse","source":"official","last_updated":"2026-03-23","capabilities":{"streaming":true,"tool_call":true},"family":"Llama-3.2","model_type":"chat","parameters":1,"page_url":"https://huggingface.co/argilla-warehouse/Llama-3.2-1B-Instruct-v2-FC","description":"This model is a fine-tuned version of [meta-llama/Llama-3.2-1B-Instruct](https://huggingface.co/meta-llama/Llama-3.2-1B-Instruct) on the [argilla-warehouse/apigen-smollm-trl-FC](https://huggingface.co/datasets/argilla-warehouse/apigen-smollm-trl-FC) dataset. 
It has been trained using [TRL](https://github.com/huggingface/trl).","release_date":"2024-10-20","context_window":131072,"tagline":"This model is a fine-tuned version of [meta-llama/Llama-3.2-1B-Instruct](https://huggingface.co/meta-llama/Llama-3.2-1B-Instruct) on the [argilla-warehouse/apigen-smollm-trl-FC](https://huggingface.co/datasets/argilla-warehouse/apigen-smollm-trl-FC) dataset.","architecture":"transformer","tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"baseten/Llama-3.2-3B-Instruct-pythonic","name":"Llama-3.2-3B-Instruct-pythonic","created_by":"baseten","source":"official","family":"Llama-3.2","release_date":"2025-09-12","context_window":131072,"license":"llama3.2","parameters":3.2,"page_url":"https://huggingface.co/baseten/Llama-3.2-3B-Instruct-pythonic","architecture":"transformer","model_type":"chat","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-05-29"},{"id":"codellama/CodeLlama-7b-Instruct-hf","name":"CodeLlama-7b-Instruct-hf","created_by":"codellama","source":"official","family":"codellama","description":"Code Llama is a collection of pretrained and fine-tuned generative text models ranging in scale from 7 billion to 34 billion parameters. This is the repository for the 7B instruct-tuned version in the Hugging Face Transformers format. This model is designed for general code synthesis and understanding. 
Links to other models can be found in the index at the bottom.","release_date":"2023-08-24","context_window":16384,"license":"llama2","parameters":6.7,"page_url":"https://huggingface.co/codellama/CodeLlama-7b-Instruct-hf","architecture":"transformer","model_type":"code","tagline":"Code Llama is a collection of pretrained and fine-tuned generative text models ranging in scale from 7 billion to 34 billion parameters.","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-05-01"},{"id":"deepcogito/cogito-v1-preview-qwen-32B","name":"cogito-v1-preview-qwen-32B","created_by":"deepcogito","source":"official","release_date":"2025-03-31","context_window":131072,"license":"apache-2.0","page_url":"https://huggingface.co/deepcogito/cogito-v1-preview-qwen-32B","architecture":"transformer","model_type":"chat","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-05-29","parameters":33},{"id":"DeepMount00/Llama-3-8b-Ita","name":"Llama-3-8b-Ita","created_by":"deepmount00","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"family":"Llama-3","model_type":"chat","parameters":8,"page_url":"https://huggingface.co/DeepMount00/Llama-3-8b-Ita","description":"**💡 Found this resource helpful?** Creating and maintaining open source AI models and datasets requires significant computational resources. If this work has been valuable to you, consider [supporting my research](https://buymeacoffee.com/michele.montebovi) to help me continue building tools that benefit the entire AI community. Every contribution directly funds more open source innovation! 
☕","release_date":"2024-05-01","context_window":8192,"license":"llama3","tagline":"**💡 Found this resource helpful?** Creating and maintaining open source AI models and datasets requires significant computational resources.","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"deepreinforce-ai/Ornith-1.0-35B","name":"Ornith-1.0-35B","created_by":"deepreinforce-ai","source":"official","release_date":"2026-06-21","license":"mit","parameters":0,"page_url":"https://huggingface.co/deepreinforce-ai/Ornith-1.0-35B","architecture":"moe","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"tools":["function_calling"],"last_updated":"2026-06-30"},{"id":"deepseek-ai/DeepSeek-R1-0528-Qwen3-8B","name":"DeepSeek-R1-0528-Qwen3-8B","created_by":"deepseek","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"model_type":"reasoning","parameters":8.2,"page_url":"https://huggingface.co/deepseek-ai/DeepSeek-R1-0528-Qwen3-8B","release_date":"2025-05-29","context_window":131072,"license":"mit","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"defog/sqlcoder-7b-2","name":"sqlcoder-7b-2","created_by":"defog","source":"official","description":"The model weights were updated at 7 AM UTC on Feb 7, 2024. 
The new model weights lead to a much more performant model – particularly for joins.","release_date":"2024-02-05","context_window":16384,"license":"cc-by-sa-4.0","parameters":6.7,"page_url":"https://huggingface.co/defog/sqlcoder-7b-2","architecture":"transformer","tagline":"The model weights were updated at 7 AM UTC on Feb 7, 2024.","capabilities":{"streaming":true,"fine_tuning":true},"open_weight":true,"last_updated":"2026-06-18"},{"id":"DeSTA-ntu/Llama-3.1-8B-Instruct","name":"Llama-3.1-8B-Instruct","created_by":"desta-ntu","source":"official","family":"Llama-3.1","release_date":"2025-07-06","context_window":131072,"parameters":8,"page_url":"https://huggingface.co/DeSTA-ntu/Llama-3.1-8B-Instruct","architecture":"transformer","model_type":"chat","capabilities":{"streaming":true,"tool_call":true},"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-05-01"},{"id":"dicta-il/DictaLM-3.0-1.7B-Instruct","name":"DictaLM-3.0-1.7B-Instruct","created_by":"dicta-il","source":"official","description":"[](https://dicta.org.il)","release_date":"2025-12-01","context_window":62080,"license":"apache-2.0","page_url":"https://huggingface.co/dicta-il/DictaLM-3.0-1.7B-Instruct","architecture":"transformer","tagline":"[](https://dicta.org.il)","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"tools":["function_calling"],"last_updated":"2026-06-10"},{"id":"dphn/Dolphin-Mistral-24B-Venice-Edition","name":"Dolphin-Mistral-24B-Venice-Edition","created_by":"dphn","source":"official","description":"Website: https://dphn.ai Twitter: https://x.com/dphnAI Web Chat: https://chat.dphn.ai Telegram bot: https://t.me/DolphinAI_bot","release_date":"2025-06-12","context_window":32768,"license":"apache-2.0","parameters":24,"page_url":"https://huggingface.co/dphn/Dolphin-Mistral-24B-Venice-Edition","architecture":"transformer","tagline":"Website: https://dphn.ai Twitter: https://x.com/dphnAI Web Chat: 
https://chat.dphn.ai Telegram bot: https://t.me/DolphinAI_bot","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"tools":["function_calling"],"last_updated":"2026-04-07"},{"id":"Efficient-Large-Model/gemma-2-2b-it","name":"gemma-2-2b-it","created_by":"efficient-large-model","source":"official","last_updated":"2026-03-24","family":"gemma-2","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"model_type":"chat","parameters":2.6,"page_url":"https://huggingface.co/Efficient-Large-Model/gemma-2-2b-it","description":"**Model Page**: [Gemma](https://ai.google.dev/gemma/docs/base)","release_date":"2024-12-12","context_window":8192,"license":"gemma","tagline":"**Model Page**: [Gemma](https://ai.google.dev/gemma/docs/base)","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"EssentialAI/rnj-1-instruct","name":"rnj-1-instruct","created_by":"essentialai","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"page_url":"https://huggingface.co/EssentialAI/rnj-1-instruct","description":"Rnj-1 is a family of 8B parameter open-weight, dense models trained from scratch by Essential AI, optimized for code and STEM with capabilities on par with SOTA open-weight models. These models perform well across a range of programming languages and boast strong agentic capabilities (e.g., inside agentic frameworks like mini-SWE-agent), while also excelling at tool-calling. 
They additionally exhibit strong capabilities in math and science.","release_date":"2025-12-04","context_window":32768,"license":"apache-2.0","parameters":8.3,"tagline":"style=\"vertical-align: middle;\" src=\"https://img.shields.io/badge/%F0%9F%8C%90%20Website-essential.ai-4b9fe1?color=4b9fe1&logoColor=white\"/>","architecture":"transformer","open_weight":true,"tools":["function_calling"],"model_type":"chat","modalities":{"input":["text"],"output":["text"]}},{"id":"failspy/llama-3-70B-Instruct-abliterated","name":"llama-3-70B-Instruct-abliterated","created_by":"failspy","source":"official","family":"llama-3","description":"This is meta-llama/Llama-3-70B-Instruct with orthogonalized bfloat16 safetensor weights, generated with the methodology that was described in the preview paper/blog post: '[Refusal in LLMs is mediated by a single direction](https://www.alignmentforum.org/posts/jGuXSZgv6qfdhMCuJ/refusal-in-llms-is-mediated-by-a-single-direction)' which I encourage you to read to understand more.","release_date":"2024-05-07","context_window":8192,"license":"llama3","page_url":"https://huggingface.co/failspy/llama-3-70B-Instruct-abliterated","architecture":"transformer","model_type":"chat","tagline":"This is meta-llama/Llama-3-70B-Instruct with orthogonalized bfloat16 safetensor weights, generated with the methodology that was described in the preview paper/blog post: '[Refusal in LLMs is 
mediated","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-04-07"},{"id":"failspy/Meta-Llama-3-8B-Instruct-abliterated-v3","name":"Meta-Llama-3-8B-Instruct-abliterated-v3","created_by":"failspy","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"family":"Llama-3","model_type":"chat","parameters":8,"page_url":"https://huggingface.co/failspy/Meta-Llama-3-8B-Instruct-abliterated-v3","description":"[My Jupyter \"cookbook\" to replicate the methodology can be found here, refined library coming soon](https://huggingface.co/failspy/llama-3-70B-Instruct-abliterated/blob/main/ortho_cookbook.ipynb)","release_date":"2024-05-20","context_window":8192,"license":"llama3","tagline":"[My Jupyter \"cookbook\" to replicate the methodology can be found here, refined library coming soon](https://huggingface.co/failspy/llama-3-70B-Instruct-abliterated/blob/main/ortho_cookbook.ipynb)","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"farbodtavakkoli/OTel-LLM-0.6B-IT","name":"OTel-LLM-0.6B-IT","created_by":"farbodtavakkoli","source":"official","description":"**OTel-LLM-0.6B-IT** is a telecom-specialized language model fine-tuned on telecommunications domain data. 
It is part of the [OTel Family of Models](https://huggingface.co/collections/farbodtavakkoli/otel-llm), an open-source initiative to build industry-standard AI models for the global telecommunications sector.","release_date":"2026-02-11","context_window":40960,"license":"apache-2.0","page_url":"https://huggingface.co/farbodtavakkoli/OTel-LLM-0.6B-IT","architecture":"transformer","tagline":"**OTel-LLM-0.6B-IT** is a telecom-specialized language model fine-tuned on telecommunications domain data.","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"tools":["function_calling"],"last_updated":"2026-04-17"},{"id":"farbodtavakkoli/OTel-LLM-1.2B-IT","name":"OTel-LLM-1.2B-IT","created_by":"farbodtavakkoli","source":"official","description":"**OTel-LLM-1.2B-IT** is a telecom-specialized language model fine-tuned on telecommunications domain data. It is part of the [OTel Family of Models](https://huggingface.co/collections/farbodtavakkoli/otel-llm), an open-source initiative to build industry-standard AI models for the global telecommunications sector.","release_date":"2026-03-10","context_window":128000,"license":"apache-2.0","page_url":"https://huggingface.co/farbodtavakkoli/OTel-LLM-1.2B-IT","architecture":"transformer","tagline":"**OTel-LLM-1.2B-IT** is a telecom-specialized language model fine-tuned on telecommunications domain data.","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"tools":["function_calling"],"last_updated":"2026-04-17"},{"id":"farbodtavakkoli/OTel-LLM-1.7B-IT","name":"OTel-LLM-1.7B-IT","created_by":"farbodtavakkoli","source":"official","description":"**OTel-LLM-1.7B-IT** is a telecom-specialized language model fine-tuned on telecommunications domain data. 
It is part of the [OTel Family of Models](https://huggingface.co/collections/farbodtavakkoli/otel-llm), an open-source initiative to build industry-standard AI models for the global telecommunications sector.","release_date":"2026-02-11","context_window":40960,"license":"apache-2.0","page_url":"https://huggingface.co/farbodtavakkoli/OTel-LLM-1.7B-IT","architecture":"transformer","tagline":"**OTel-LLM-1.7B-IT** is a telecom-specialized language model fine-tuned on telecommunications domain data.","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"tools":["function_calling"],"last_updated":"2026-04-17"},{"id":"farbodtavakkoli/OTel-LLM-12B-IT","name":"OTel-LLM-12B-IT","created_by":"farbodtavakkoli","source":"official","description":"**OTel-LLM-12B-IT** is a telecom-specialized language model fine-tuned on telecommunications domain data. It is part of the [OTel Family of Models](https://huggingface.co/collections/farbodtavakkoli/otel-llm), an open-source initiative to build industry-standard AI models for the global telecommunications sector.","release_date":"2026-02-11","license":"apache-2.0","page_url":"https://huggingface.co/farbodtavakkoli/OTel-LLM-12B-IT","architecture":"transformer","tagline":"**OTel-LLM-12B-IT** is a telecom-specialized language model fine-tuned on telecommunications domain data.","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"tools":["function_calling"],"last_updated":"2026-04-22"},{"id":"farbodtavakkoli/OTel-LLM-14B-IT","name":"OTel-LLM-14B-IT","created_by":"farbodtavakkoli","source":"official","description":"**OTel-LLM-14B-IT** is a telecom-specialized language model fine-tuned on telecommunications domain data. 
It is part of the [OTel Family of Models](https://huggingface.co/collections/farbodtavakkoli/otel-llm), an open-source initiative to build industry-standard AI models for the global telecommunications sector.","release_date":"2026-02-11","context_window":40960,"license":"apache-2.0","page_url":"https://huggingface.co/farbodtavakkoli/OTel-LLM-14B-IT","architecture":"transformer","tagline":"**OTel-LLM-14B-IT** is a telecom-specialized language model fine-tuned on telecommunications domain data.","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"tools":["function_calling"],"last_updated":"2026-04-17"},{"id":"farbodtavakkoli/OTel-LLM-1B-IT","name":"OTel-LLM-1B-IT","created_by":"farbodtavakkoli","source":"official","description":"**OTel-LLM-1B-IT** is a telecom-specialized language model fine-tuned on telecommunications domain data. It is part of the [OTel Family of Models](https://huggingface.co/collections/farbodtavakkoli/otel-llm), an open-source initiative to build industry-standard AI models for the global telecommunications sector.","release_date":"2026-02-11","context_window":32768,"license":"apache-2.0","parameters":1,"page_url":"https://huggingface.co/farbodtavakkoli/OTel-LLM-1B-IT","architecture":"transformer","tagline":"**OTel-LLM-1B-IT** is a telecom-specialized language model fine-tuned on telecommunications domain data.","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"tools":["function_calling"],"last_updated":"2026-04-17"},{"id":"farbodtavakkoli/OTel-LLM-20B-IT","name":"OTel-LLM-20B-IT","created_by":"farbodtavakkoli","source":"official","description":"**OTel-LLM-20B-IT** is a telecom-specialized language model fine-tuned on telecommunications domain data. 
It is part of the [OTel Family of Models](https://huggingface.co/collections/farbodtavakkoli/otel-llm), an open-source initiative to build industry-standard AI models for the global telecommunications sector.","release_date":"2026-02-13","context_window":131072,"license":"apache-2.0","page_url":"https://huggingface.co/farbodtavakkoli/OTel-LLM-20B-IT","architecture":"moe","tagline":"**OTel-LLM-20B-IT** is a telecom-specialized language model fine-tuned on telecommunications domain data.","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"tools":["function_calling"],"last_updated":"2026-04-17"},{"id":"farbodtavakkoli/OTel-LLM-270M-IT","name":"OTel-LLM-270M-IT","created_by":"farbodtavakkoli","source":"official","description":"**OTel-LLM-270M-IT** is a telecom-specialized language model fine-tuned on telecommunications domain data. It is part of the [OTel Family of Models](https://huggingface.co/collections/farbodtavakkoli/otel-llm), an open-source initiative to build industry-standard AI models for the global telecommunications sector.","release_date":"2026-02-11","context_window":32768,"license":"apache-2.0","parameters":0.27,"page_url":"https://huggingface.co/farbodtavakkoli/OTel-LLM-270M-IT","architecture":"transformer","tagline":"**OTel-LLM-270M-IT** is a telecom-specialized language model fine-tuned on telecommunications domain data.","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"tools":["function_calling"],"last_updated":"2026-04-17"},{"id":"farbodtavakkoli/OTel-LLM-27B-IT","name":"OTel-LLM-27B-IT","created_by":"farbodtavakkoli","source":"official","description":"**OTel-LLM-27B-IT** is a telecom-specialized language model fine-tuned on telecommunications domain data. 
It is part of the [OTel Family of Models](https://huggingface.co/collections/farbodtavakkoli/otel-llm), an open-source initiative to build industry-standard AI models for the global telecommunications sector.","release_date":"2026-02-11","license":"apache-2.0","page_url":"https://huggingface.co/farbodtavakkoli/OTel-LLM-27B-IT","architecture":"transformer","tagline":"**OTel-LLM-27B-IT** is a telecom-specialized language model fine-tuned on telecommunications domain data.","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"tools":["function_calling"],"last_updated":"2026-04-22"},{"id":"farbodtavakkoli/OTel-LLM-32B-IT","name":"OTel-LLM-32B-IT","created_by":"farbodtavakkoli","source":"official","description":"**OTel-LLM-32B-IT** is a telecom-specialized language model fine-tuned on telecommunications domain data. It is part of the [OTel Family of Models](https://huggingface.co/collections/farbodtavakkoli/otel-llm), an open-source initiative to build industry-standard AI models for the global telecommunications sector.","release_date":"2026-02-11","context_window":65536,"license":"apache-2.0","page_url":"https://huggingface.co/farbodtavakkoli/OTel-LLM-32B-IT","architecture":"transformer","tagline":"**OTel-LLM-32B-IT** is a telecom-specialized language model fine-tuned on telecommunications domain data.","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"tools":["function_calling"],"last_updated":"2026-04-17"},{"id":"farbodtavakkoli/OTel-LLM-4B-IT","name":"OTel-LLM-4B-IT","created_by":"farbodtavakkoli","source":"official","description":"**OTel-LLM-4B-IT** is a telecom-specialized language model fine-tuned on telecommunications domain data. 
It is part of the [OTel Family of Models](https://huggingface.co/collections/farbodtavakkoli/otel-llm), an open-source initiative to build industry-standard AI models for the global telecommunications sector.","release_date":"2026-02-11","license":"apache-2.0","parameters":4.3,"page_url":"https://huggingface.co/farbodtavakkoli/OTel-LLM-4B-IT","architecture":"transformer","tagline":"**OTel-LLM-4B-IT** is a telecom-specialized language model fine-tuned on telecommunications domain data.","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"tools":["function_calling"],"last_updated":"2026-04-17"},{"id":"farbodtavakkoli/OTel-LLM-7B-IT","name":"OTel-LLM-7B-IT","created_by":"farbodtavakkoli","source":"official","description":"**OTel-LLM-7B-IT** is a telecom-specialized language model fine-tuned on telecommunications domain data. It is part of the [OTel Family of Models](https://huggingface.co/collections/farbodtavakkoli/otel-llm), an open-source initiative to build industry-standard AI models for the global telecommunications sector.","release_date":"2026-02-11","context_window":65536,"license":"apache-2.0","page_url":"https://huggingface.co/farbodtavakkoli/OTel-LLM-7B-IT","architecture":"transformer","tagline":"**OTel-LLM-7B-IT** is a telecom-specialized language model fine-tuned on telecommunications domain data.","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"tools":["function_calling"],"last_updated":"2026-04-17"},{"id":"farbodtavakkoli/OTel-LLM-8.2B-IT","name":"OTel-LLM-8.2B-IT","created_by":"farbodtavakkoli","source":"official","description":"**OTel-LLM-8.2B-IT** is a telecom-specialized language model fine-tuned on telecommunications domain data. 
It is part of the [OTel Family of Models](https://huggingface.co/collections/farbodtavakkoli/otel-llm), an open-source initiative to build industry-standard AI models for the global telecommunications sector.","release_date":"2026-02-11","context_window":40960,"license":"apache-2.0","page_url":"https://huggingface.co/farbodtavakkoli/OTel-LLM-8.2B-IT","architecture":"transformer","tagline":"**OTel-LLM-8.2B-IT** is a telecom-specialized language model fine-tuned on telecommunications domain data.","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"tools":["function_calling"],"last_updated":"2026-04-17"},{"id":"farbodtavakkoli/OTel-LLM-8.3B-IT","name":"OTel-LLM-8.3B-IT","created_by":"farbodtavakkoli","source":"official","description":"**OTel-LLM-8.3B-IT** is a telecom-specialized language model fine-tuned on telecommunications domain data. It is part of the [OTel Family of Models](https://huggingface.co/collections/farbodtavakkoli/otel-llm), an open-source initiative to build industry-standard AI models for the global telecommunications sector.","release_date":"2026-02-11","context_window":32768,"license":"apache-2.0","page_url":"https://huggingface.co/farbodtavakkoli/OTel-LLM-8.3B-IT","architecture":"transformer","tagline":"**OTel-LLM-8.3B-IT** is a telecom-specialized language model fine-tuned on telecommunications domain 
data.","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"tools":["function_calling"],"last_updated":"2026-04-17"},{"id":"fdtn-ai/Foundation-Sec-8B-Instruct","name":"Foundation-Sec-8B-Instruct","created_by":"fdtn-ai","source":"official","release_date":"2025-07-29","context_window":131072,"license":"other","parameters":8,"page_url":"https://huggingface.co/fdtn-ai/Foundation-Sec-8B-Instruct","architecture":"transformer","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"tools":["function_calling"],"last_updated":"2026-04-01"},{"id":"Featherless-Chat-Models/Mistral-7B-Instruct-v0.2","name":"Mistral-7B-Instruct-v0.2","created_by":"featherless-chat-models","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"model_type":"chat","parameters":7.2,"page_url":"https://huggingface.co/Featherless-Chat-Models/Mistral-7B-Instruct-v0.2","release_date":"2025-05-08","context_window":32768,"license":"apache-2.0","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"FlagAlpha/Llama3-Chinese-8B-Instruct","name":"Llama3-Chinese-8B-Instruct","created_by":"flagalpha","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"model_type":"chat","parameters":8,"page_url":"https://huggingface.co/FlagAlpha/Llama3-Chinese-8B-Instruct","description":"Llama3-Chinese-8B-Instruct基于Llama3-8B中文微调对话模型,由Llama中文社区和AtomEcho(原子回声)联合研发,我们会持续提供更新的模型参数,模型训练过程见 [https://llama.family](https://llama.family)。","release_date":"2024-04-23","context_window":8192,"license":"apache-2.0","tagline":"Llama3-Chinese-8B-Instruct基于Llama3-8B中文微调对话模型,由Llama中文社区和AtomEcho(原子回声)联合研发,我们会持续提供更新的模型参数,模型训练过程见 
[https://llama.family](https://llama.family)。","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"google/gemma-1.1-2b-it","name":"gemma-1.1-2b-it","created_by":"google","source":"official","family":"gemma-1","release_date":"2024-03-26","license":"gemma","parameters":2.5,"page_url":"https://huggingface.co/google/gemma-1.1-2b-it","architecture":"transformer","model_type":"chat","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-05-29"},{"id":"google/gemma-2-27b-it","name":"gemma-2-27b-it","created_by":"google","source":"official","family":"gemma-2","release_date":"2024-06-24","license":"gemma","parameters":27,"page_url":"https://huggingface.co/google/gemma-2-27b-it","architecture":"transformer","model_type":"chat","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-05-01"},{"id":"google/gemma-2-2b-it","name":"gemma-2-2b-it","created_by":"google","source":"official","last_updated":"2026-03-24","family":"gemma-2","release_date":"2024-07-16","license":"gemma","parameters":2.6,"page_url":"https://huggingface.co/google/gemma-2-2b-it","architecture":"transformer","model_type":"chat","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"]},{"id":"google/gemma-2-2b-jpn-it","name":"gemma-2-2b-jpn-it","created_by":"google","source":"official","last_updated":"2026-03-24","family":"gemma-2","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"model_type":"chat","parameters":2.6,"page_url":"https://huggingface.co/google/gemma-2-2b-jpn-it","release_date":"2024-09-25","license":"gemma","architecture":"t
ransformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"google/gemma-2-9b-it","name":"gemma-2-9b-it","created_by":"google","source":"official","last_updated":"2026-03-24","family":"gemma-2","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"model_type":"chat","parameters":9.2,"page_url":"https://huggingface.co/google/gemma-2-9b-it","release_date":"2024-06-24","license":"gemma","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"google/gemma-2b-it","name":"gemma-2b-it","created_by":"google","source":"official","family":"gemma-2b","release_date":"2024-02-08","license":"gemma","page_url":"https://huggingface.co/google/gemma-2b-it","architecture":"transformer","model_type":"chat","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-05-29","parameters":2.5},{"id":"google/gemma-3-1b-it","name":"gemma-3-1b-it","created_by":"google","source":"official","family":"gemma-3","release_date":"2025-03-10","license":"gemma","parameters":1,"page_url":"https://huggingface.co/google/gemma-3-1b-it","architecture":"transformer","model_type":"chat","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-05-01"},{"id":"google/gemma-7b-it","name":"gemma-7b-it","created_by":"google","source":"official","family":"gemma-7b","release_date":"2024-02-13","license":"gemma","page_url":"https://huggingface.co/google/gemma-7b-it","architecture":"transformer","model_type":"chat","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-06-18","pa
rameters":8.5},{"id":"google/medgemma-27b-text-it","name":"medgemma-27b-text-it","created_by":"google","source":"official","release_date":"2025-05-19","license":"other","page_url":"https://huggingface.co/google/medgemma-27b-text-it","architecture":"transformer","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"tools":["function_calling"],"last_updated":"2026-05-29","parameters":27},{"id":"GraySwanAI/Llama-3-8B-Instruct-RR","name":"Llama-3-8B-Instruct-RR","created_by":"grayswanai","source":"official","last_updated":"2026-03-23","capabilities":{"streaming":true,"tool_call":true},"family":"Llama-3","model_type":"chat","parameters":8,"page_url":"https://huggingface.co/GraySwanAI/Llama-3-8B-Instruct-RR","description":"Llama-3-8B-Instruct-RR is a Llama-3 model with circuit breakers inserted using Representation Rerouting (RR).","release_date":"2024-07-08","context_window":8192,"tagline":"Llama-3-8B-Instruct-RR is a Llama-3 model with circuit breakers inserted using Representation Rerouting (RR).","architecture":"transformer","tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"GritLM/GritLM-7B","name":"GritLM-7B","created_by":"gritlm","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"parameters":7.2,"page_url":"https://huggingface.co/GritLM/GritLM-7B","description":"> GritLM is a generative representational instruction tuned language model. 
It unifies text representation (embedding) and text generation into a single model achieving state-of-the-art performance on both types of tasks.","release_date":"2024-02-11","context_window":32768,"license":"apache-2.0","tagline":"> GritLM is a generative representational instruction tuned language model.","architecture":"transformer","open_weight":true,"tools":["function_calling"]},{"id":"h2oai/h2ogpt-4096-llama2-7b-chat","name":"h2ogpt-4096-llama2-7b-chat","created_by":"h2oai","source":"official","description":"h2oGPT clone of [Meta's Llama 2 7B Chat](https://huggingface.co/meta-llama/Llama-2-7b-chat-hf).","release_date":"2023-08-09","context_window":4096,"license":"llama2","parameters":6.7,"page_url":"https://huggingface.co/h2oai/h2ogpt-4096-llama2-7b-chat","architecture":"transformer","tagline":"h2oGPT clone of [Meta's Llama 2 7B Chat](https://huggingface.co/meta-llama/Llama-2-7b-chat-hf).","capabilities":{"streaming":true,"fine_tuning":true},"open_weight":true,"last_updated":"2026-05-17"},{"id":"huihui-ai/DeepSeek-R1-Distill-Qwen-32B-abliterated","name":"DeepSeek-R1-Distill-Qwen-32B-abliterated","created_by":"huihui-ai","source":"official","description":"This is an uncensored version of [deepseek-ai/DeepSeek-R1-Distill-Qwen-32B](https://huggingface.co/deepseek-ai/DeepSeek-R1-Distill-Qwen-32B) created with abliteration (see [remove-refusals-with-transformers](https://github.com/Sumandora/remove-refusals-with-transformers) to know more about it). 
This is a crude, proof-of-concept implementation to remove refusals from an LLM model without using TransformerLens.","release_date":"2025-01-22","context_window":131072,"parameters":33,"page_url":"https://huggingface.co/huihui-ai/DeepSeek-R1-Distill-Qwen-32B-abliterated","architecture":"transformer","model_type":"reasoning","tagline":"This is an uncensored version of [deepseek-ai/DeepSeek-R1-Distill-Qwen-32B](https://huggingface.co/deepseek-ai/DeepSeek-R1-Distill-Qwen-32B) created with abliteration (see [remove-refusals-with-transformers](https://github.com/Sumandora/remove-refusals-with-transformers) to know more about it).","capabilities":{"streaming":true,"tool_call":true},"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-04-14"},{"id":"huihui-ai/Qwen2.5-14B-Instruct-abliterated-v2","name":"Qwen2.5-14B-Instruct-abliterated-v2","created_by":"huihui-ai","source":"official","description":"This is an uncensored version of [Qwen2.5-14B-Instruct](https://huggingface.co/Qwen/Qwen2.5-14B-Instruct) created with abliteration (see [this article](https://huggingface.co/blog/mlabonne/abliteration) to know more about it).","release_date":"2024-10-09","context_window":32768,"license":"apache-2.0","parameters":15,"page_url":"https://huggingface.co/huihui-ai/Qwen2.5-14B-Instruct-abliterated-v2","architecture":"transformer","model_type":"chat","tagline":"This is an uncensored version of [Qwen2.5-14B-Instruct](https://huggingface.co/Qwen/Qwen2.5-14B-Instruct) created with abliteration (see [this article](https://huggingface.co/blog/mlabonne/abliteratio","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-04-21"},{"id":"huihui-ai/Qwen2.5-14B-Instruct-abliterated","name":"Qwen2.5-14B-Instruct-abliterated","created_by":"huihui-ai","source":"official","description":"This is an uncensored version of 
[Qwen/Qwen2.5-14B-Instruct](https://huggingface.co/Qwen/Qwen2.5-14B-Instruct) created with abliteration (see [this article](https://huggingface.co/blog/mlabonne/abliteration) to know more about it).","release_date":"2024-09-25","context_window":32768,"license":"apache-2.0","parameters":15,"page_url":"https://huggingface.co/huihui-ai/Qwen2.5-14B-Instruct-abliterated","architecture":"transformer","model_type":"chat","tagline":"This is an uncensored version of [Qwen/Qwen2.5-14B-Instruct](https://huggingface.co/Qwen/Qwen2.5-14B-Instruct) created with abliteration (see [this article](https://huggingface.co/blog/mlabonne/ablite","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-05-23"},{"id":"huihui-ai/Qwen2.5-72B-Instruct-abliterated","name":"Qwen2.5-72B-Instruct-abliterated","created_by":"huihui-ai","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"model_type":"chat","parameters":73,"page_url":"https://huggingface.co/huihui-ai/Qwen2.5-72B-Instruct-abliterated","description":"This is an uncensored version of [Qwen/Qwen2.5-72B-Instruct](https://huggingface.co/Qwen/Qwen2.5-72B-Instruct) created with abliteration (see [remove-refusals-with-transformers](https://github.com/Sumandora/remove-refusals-with-transformers) to know more about it). 
This is a crude, proof-of-concept implementation to remove refusals from an LLM model without using TransformerLens.","release_date":"2024-10-26","context_window":32768,"license":"other","tagline":"This is an uncensored version of [Qwen/Qwen2.5-72B-Instruct](https://huggingface.co/Qwen/Qwen2.5-72B-Instruct) created with abliteration (see [remove-refusals-with-transformers](https://github.com/Sumandora/remove-refusals-with-transformers) to know more about it).","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"instruction-pretrain/finance-Llama3-8B","name":"finance-Llama3-8B","created_by":"instruction-pretrain","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"fine_tuning":true},"parameters":8,"page_url":"https://huggingface.co/instruction-pretrain/finance-Llama3-8B","description":"This repo contains the **finance model developed from Llama3-8B** in our paper [Instruction Pre-Training: Language Models are Supervised Multitask Learners](https://huggingface.co/papers/2406.14491).","release_date":"2024-06-18","context_window":8192,"license":"llama3","tagline":"This repo contains the **finance model developed from Llama3-8B** in our paper [Instruction Pre-Training: Language Models are Supervised Multitask 
Learners](https://huggingface.co/papers/2406.14491).","architecture":"transformer","open_weight":true},{"id":"Intel/neural-chat-7b-v3-3","name":"neural-chat-7b-v3-3","created_by":"intel","source":"official","last_updated":"2026-03-22","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"parameters":7.2,"page_url":"https://huggingface.co/Intel/neural-chat-7b-v3-3","release_date":"2023-12-09","context_window":32768,"license":"apache-2.0"},{"id":"invalid-coder/Sakura-SOLAR-Instruct-CarbonVillain-en-10.7B-v2-slerp","name":"Sakura-SOLAR-Instruct-CarbonVillain-en-10.7B-v2-slerp","created_by":"invalid-coder","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"parameters":11,"page_url":"https://huggingface.co/invalid-coder/Sakura-SOLAR-Instruct-CarbonVillain-en-10.7B-v2-slerp","description":"NeuralPipe-7B-slerp is a merge of the following models using [LazyMergekit](https://colab.research.google.com/drive/1obulZ1ROXHjYLn6PPZJwRR6GzgQogxxb?usp=sharing): * [jeonsworld/CarbonVillain-en-10.7B-v2](https://huggingface.co/jeonsworld/CarbonVillain-en-10.7B-v2) * [kyujinpy/Sakura-SOLAR-Instruct](https://huggingface.co/kyujinpy/Sakura-SOLAR-Instruct)","release_date":"2024-01-10","context_window":4096,"license":"apache-2.0","tagline":"NeuralPipe-7B-slerp is a merge of the following models using [LazyMergekit](https://colab.research.google.com/drive/1obulZ1ROXHjYLn6PPZJwRR6GzgQogxxb?usp=sharing): * 
[jeonsworld/CarbonVillain-en-10.7B","architecture":"transformer","open_weight":true,"tools":["function_calling"]},{"id":"kakaocorp/kanana-1.5-8b-instruct-2505","name":"kanana-1.5-8b-instruct-2505","created_by":"kakaocorp","source":"official","release_date":"2025-05-21","context_window":32768,"license":"apache-2.0","alias":"kakaocorp/kanana-1.5-8b-instruct","page_url":"https://huggingface.co/kakaocorp/kanana-1.5-8b-instruct-2505","architecture":"transformer","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"tools":["function_calling"],"last_updated":"2026-06-10"},{"id":"kakaocorp/kanana-1.5-8b-instruct","name":"kanana-1.5-8b-instruct-2505","created_by":"kakaocorp","source":"official","release_date":"2025-05-21","context_window":32768,"license":"apache-2.0","page_url":"https://huggingface.co/kakaocorp/kanana-1.5-8b-instruct-2505","architecture":"transformer","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"tools":["function_calling"],"snapshots":["kakaocorp/kanana-1.5-8b-instruct-2505"],"last_updated":"2026-06-10"},{"id":"llmfan46/Gemma-4-Garnet-V2-31B-it-ultra-uncensored-heretic","name":"Gemma-4-Garnet-V2-31B-it-ultra-uncensored-heretic","created_by":"llmfan46","source":"official","release_date":"2026-04-25","license":"apache-2.0","parameters":31,"page_url":"https://huggingface.co/llmfan46/Gemma-4-Garnet-V2-31B-it-ultra-uncensored-heretic","architecture":"transformer","model_type":"chat","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-06-29"},{"id":"lmstudio-community/Qwen3-1.7B-MLX-bf16","name":"Qwen3-1.7B-MLX-bf16","created_by":"lmstudio-community","source":"official","description":"This model [lmstudio-community/Qwen3-1.7B-MLX-bf16](https://huggingface.co/lmstudio-community/Qwen3-1.7B-MLX-bf16) was converted to MLX format from 
[Qwen/Qwen3-1.7B](https://huggingface.co/Qwen/Qwen3-1.7B) using mlx-lm version **0.24.0**.","release_date":"2025-04-28","context_window":40960,"license":"apache-2.0","parameters":1.7,"page_url":"https://huggingface.co/lmstudio-community/Qwen3-1.7B-MLX-bf16","architecture":"transformer","model_type":"chat","tagline":"This model [lmstudio-community/Qwen3-1.7B-MLX-bf16](https://huggingface.co/lmstudio-community/Qwen3-1.7B-MLX-bf16) was converted to MLX format from [Qwen/Qwen3-1.7B](https://huggingface.co/Qwen/Qwen3-","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-05-01"},{"id":"m8than/Mistral-Nemo-Instruct-2407-lenient-chatfix","name":"Mistral-Nemo-Instruct-2407-lenient-chatfix","created_by":"m8than","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"model_type":"chat","page_url":"https://huggingface.co/m8than/Mistral-Nemo-Instruct-2407-lenient-chatfix","description":"It's just mistral nemo 2407 with a less strict chat format.","release_date":"2025-05-06","context_window":131072,"license":"apache-2.0","parameters":12,"tagline":"It's just mistral nemo 2407 with a less strict chat 
format.","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"meta-llama/Llama-2-13b-chat-hf","name":"Llama-2-13b-chat-hf","created_by":"meta","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"family":"Llama-2","model_type":"chat","parameters":13,"page_url":"https://huggingface.co/meta-llama/Llama-2-13b-chat-hf","release_date":"2023-07-13","license":"llama2","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]},"context_window":4096,"max_output_tokens":4096},{"id":"meta-llama/Llama-3.1-70B-Instruct","name":"Llama-3.1-70B-Instruct","created_by":"meta","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"family":"Llama-3.1","model_type":"chat","parameters":71,"page_url":"https://huggingface.co/meta-llama/Llama-3.1-70B-Instruct","release_date":"2024-07-16","license":"llama3.1","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]},"context_window":131072,"max_output_tokens":131072,"knowledge_cutoff":"2023-12"},{"id":"meta-llama/Llama-3.1-8B-Instruct","name":"Llama-3.1-8B-Instruct","created_by":"meta","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"family":"Llama-3.1","model_type":"chat","parameters":8,"page_url":"https://huggingface.co/meta-llama/Llama-3.1-8B-Instruct","release_date":"2024-07-18","license":"llama3.1","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]},"context_window":131072,"max_output_tokens":131072,"knowledge_cutoff":"2023-12"},{"id":"meta-llama/Llama-3.2-1B-Instruct","name":"Llama-3.2-1B-Instruct","created_by":"meta","source":"official","last_updated
":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"family":"Llama-3.2","model_type":"chat","parameters":1.2,"page_url":"https://huggingface.co/meta-llama/Llama-3.2-1B-Instruct","release_date":"2024-09-18","license":"llama3.2","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]},"context_window":131072,"max_output_tokens":131072,"knowledge_cutoff":"2023-12"},{"id":"meta-llama/Llama-3.2-3B-Instruct","name":"Llama-3.2-3B-Instruct","created_by":"meta","source":"official","family":"Llama-3.2","release_date":"2024-09-18","license":"llama3.2","parameters":3.2,"page_url":"https://huggingface.co/meta-llama/Llama-3.2-3B-Instruct","architecture":"transformer","model_type":"chat","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-05-14","context_window":131072,"max_output_tokens":131072,"knowledge_cutoff":"2023-12"},{"id":"meta-llama/Llama-3.3-70B-Instruct","name":"Llama-3.3-70B-Instruct","created_by":"meta","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"family":"Llama-3.3","model_type":"chat","parameters":71,"page_url":"https://huggingface.co/meta-llama/Llama-3.3-70B-Instruct","release_date":"2024-11-26","license":"llama3.3","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]},"context_window":131072,"max_output_tokens":131072,"knowledge_cutoff":"2023-12"},{"id":"meta-llama/Meta-Llama-3-70B-Instruct","name":"Meta-Llama-3-70B-Instruct","created_by":"meta","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"family":"Llama-3","model_type":"chat","parameters":71,"page_url":"https://huggingface.co/meta-llama/Meta-Llama-3-70B-Instr
uct","release_date":"2024-04-17","license":"llama3","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]},"context_window":8192,"max_output_tokens":8192},{"id":"meta-llama/Meta-Llama-3-8B-Instruct","name":"Meta-Llama-3-8B-Instruct","created_by":"meta","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"family":"Llama-3","model_type":"chat","parameters":8,"page_url":"https://huggingface.co/meta-llama/Meta-Llama-3-8B-Instruct","release_date":"2024-04-17","license":"llama3","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]},"context_window":8192,"max_output_tokens":8192},{"id":"microsoft/Phi-3-mini-128k-instruct","name":"Phi-3-mini-128k-instruct","created_by":"microsoft","source":"official","description":"🎉**Phi-4**: [[multimodal-instruct](https://huggingface.co/microsoft/Phi-4-multimodal-instruct) | [onnx](https://huggingface.co/microsoft/Phi-4-multimodal-instruct-onnx)]; [[mini-instruct](https://huggingface.co/microsoft/Phi-4-mini-instruct) | [onnx](https://huggingface.co/microsoft/Phi-4-mini-instruct-onnx)]","release_date":"2024-04-22","context_window":131072,"license":"mit","parameters":3.8,"page_url":"https://huggingface.co/microsoft/Phi-3-mini-128k-instruct","architecture":"transformer","model_type":"chat","tagline":"🎉**Phi-4**: [[multimodal-instruct](https://huggingface.co/microsoft/Phi-4-multimodal-instruct) | [onnx](https://huggingface.co/microsoft/Phi-4-multimodal-instruct-onnx)]; [[mini-instruct](https://hug","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-05-29"},{"id":"microsoft/Phi-3-mini-4k-instruct","name":"Phi-3-mini-4k-instruct","created_by":"microsoft","source":"official","description":"🎉 
**Phi-3.5**: [[mini-instruct]](https://huggingface.co/microsoft/Phi-3.5-mini-instruct); [[MoE-instruct]](https://huggingface.co/microsoft/Phi-3.5-MoE-instruct) ; [[vision-instruct]](https://huggingface.co/microsoft/Phi-3.5-vision-instruct)","release_date":"2024-04-22","context_window":4096,"license":"mit","parameters":3.8,"page_url":"https://huggingface.co/microsoft/Phi-3-mini-4k-instruct","architecture":"transformer","model_type":"chat","tagline":"🎉 **Phi-3.5**: [[mini-instruct]](https://huggingface.co/microsoft/Phi-3.5-mini-instruct); [[MoE-instruct]](https://huggingface.co/microsoft/Phi-3.5-MoE-instruct) ; [[vision-instruct]](https://hugging","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-05-01"},{"id":"microsoft/Phi-4-mini-instruct","name":"Phi-4-mini-instruct","created_by":"microsoft","source":"official","description":"🎉**Phi-4**: [[mini-reasoning](https://huggingface.co/microsoft/Phi-4-mini-reasoning) | [reasoning](https://huggingface.co/microsoft/Phi-4-reasoning)] | [[multimodal-instruct](https://huggingface.co/microsoft/Phi-4-multimodal-instruct) | [onnx](https://huggingface.co/microsoft/Phi-4-multimodal-instruct-onnx)]; [[mini-instruct](https://huggingface.co/microsoft/Phi-4-mini-instruct) | [onnx](https://huggingface.co/microsoft/Phi-4-mini-instruct-onnx)]","release_date":"2025-02-19","context_window":131072,"license":"mit","page_url":"https://huggingface.co/microsoft/Phi-4-mini-instruct","architecture":"transformer","model_type":"chat","tagline":"🎉**Phi-4**: [[mini-reasoning](https://huggingface.co/microsoft/Phi-4-mini-reasoning) | [reasoning](https://huggingface.co/microsoft/Phi-4-reasoning)] | 
[[multimodal-instruct](https://huggingface.co/m","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-05-29","parameters":3.8},{"id":"mistralai/Mistral-7B-Instruct-v0.1","name":"Mistral-7B-Instruct-v0.1","created_by":"mistral","source":"official","release_date":"2023-09-27","context_window":32768,"license":"apache-2.0","page_url":"https://huggingface.co/mistralai/Mistral-7B-Instruct-v0.1","architecture":"transformer","model_type":"chat","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-05-23","parameters":7.2},{"id":"mistralai/Mistral-7B-Instruct-v0.2","name":"Mistral-7B-Instruct-v0.2","created_by":"mistral","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"model_type":"chat","parameters":7.2,"page_url":"https://huggingface.co/mistralai/Mistral-7B-Instruct-v0.2","release_date":"2023-12-11","context_window":32768,"license":"apache-2.0","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"mlabonne/Meta-Llama-3.1-8B-Instruct-abliterated","name":"Meta-Llama-3.1-8B-Instruct-abliterated","created_by":"mlabonne","source":"official","last_updated":"2026-03-24","family":"Llama-3.1","page_url":"https://huggingface.co/mlabonne/Meta-Llama-3.1-8B-Instruct-abliterated","model_type":"chat","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"description":"This is an uncensored version of Llama 3.1 8B Instruct created with abliteration (see [this article](https://huggingface.co/blog/mlabonne/abliteration) to know more about it).","release_date":"2024-07-24","context_window":131072,"license":"llama3.1","parameters":8,"tagline":"This is an 
uncensored version of Llama 3.1 8B Instruct created with abliteration (see [this article](https://huggingface.co/blog/mlabonne/abliteration) to know more about it).","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"mlabonne/NeuralDaredevil-8B-abliterated","name":"NeuralDaredevil-8B-abliterated","created_by":"mlabonne","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"parameters":8,"page_url":"https://huggingface.co/mlabonne/NeuralDaredevil-8B-abliterated","description":"This is a DPO fine-tune of [mlabonne/Daredevil-8-abliterated](https://huggingface.co/mlabonne/Daredevil-8B-abliterated), trained on one epoch of [mlabonne/orpo-dpo-mix-40k](https://huggingface.co/datasets/mlabonne/orpo-dpo-mix-40k). The DPO fine-tuning successfully recovers the performance loss due to the abliteration process, making it an excellent uncensored model.","release_date":"2024-05-27","context_window":8192,"license":"llama3","tagline":"This is a DPO fine-tune of [mlabonne/Daredevil-8-abliterated](https://huggingface.co/mlabonne/Daredevil-8B-abliterated), trained on one epoch of 
[mlabonne/orpo-dpo-mix-40k](https://huggingface.co/datasets/mlabonne/orpo-dpo-mix-40k).","architecture":"transformer","open_weight":true,"tools":["function_calling"]},{"id":"moonshotai/Kimi-K2-Instruct-0905","name":"Kimi-K2-Instruct-0905","created_by":"moonshot","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"family":"Kimi-K2","model_type":"chat","page_url":"https://huggingface.co/moonshotai/Kimi-K2-Instruct-0905","release_date":"2025-09-03","context_window":262144,"license":"other","parameters":1026,"architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"moonshotai/Kimi-K2-Instruct","name":"Kimi-K2-Instruct","created_by":"moonshot","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"family":"Kimi-K2","model_type":"chat","page_url":"https://huggingface.co/moonshotai/Kimi-K2-Instruct","release_date":"2025-07-11","context_window":131072,"license":"other","parameters":1026,"architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"moonshotai/Kimi-K2-Thinking","name":"Kimi-K2-Thinking","created_by":"moonshot","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true,"reasoning":true},"family":"Kimi-K2","model_type":"chat","page_url":"https://huggingface.co/moonshotai/Kimi-K2-Thinking","release_date":"2025-11-04","context_window":262144,"license":"other","parameters":1058,"architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]},"description":"Long-term thinking, multi-step tool usage, complex problem solving.","tagline":"Long-term thinking, multi-step tool usage, complex problem 
solving.","max_output_tokens":32768},{"id":"moonshotai/Kimi-Linear-48B-A3B-Instruct","name":"Kimi-Linear-48B-A3B-Instruct","created_by":"moonshot","source":"official","family":"kimi","release_date":"2025-10-30","license":"mit","parameters":49,"page_url":"https://huggingface.co/moonshotai/Kimi-Linear-48B-A3B-Instruct","architecture":"transformer","model_type":"chat","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-05-01"},{"id":"NousResearch/Meta-Llama-3-70B-Instruct","name":"Meta-Llama-3-70B-Instruct","created_by":"nousresearch","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"family":"Llama-3","model_type":"chat","parameters":71,"page_url":"https://huggingface.co/NousResearch/Meta-Llama-3-70B-Instruct","release_date":"2024-04-19","context_window":8192,"license":"other","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"NousResearch/Meta-Llama-3-8B-Instruct","name":"Meta-Llama-3-8B-Instruct","created_by":"nousresearch","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"family":"Llama-3","model_type":"chat","parameters":8,"page_url":"https://huggingface.co/NousResearch/Meta-Llama-3-8B-Instruct","release_date":"2024-04-18","context_window":8192,"license":"other","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"NousResearch/Meta-Llama-3.1-8B-Instruct","name":"Meta-Llama-3.1-8B-Instruct","created_by":"nousresearch","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"family":"Llama-3.1","model_type":"chat","parameters":8,"page_url":"https://huggingface.co/NousResear
ch/Meta-Llama-3.1-8B-Instruct","release_date":"2024-07-24","context_window":131072,"license":"llama3.1","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"nvidia/Gemma-4-31B-IT-NVFP4","name":"Gemma-4-31B-IT-NVFP4","created_by":"nvidia","source":"official","release_date":"2026-04-02","license":"other","parameters":21,"page_url":"https://huggingface.co/nvidia/Gemma-4-31B-IT-NVFP4","architecture":"transformer","model_type":"chat","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-05-14"},{"id":"nvidia/Llama-3.1-8B-Instruct-FP8","name":"Llama-3.1-8B-Instruct-FP8","created_by":"nvidia","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"family":"Llama-3.1","model_type":"chat","parameters":8,"page_url":"https://huggingface.co/nvidia/Llama-3.1-8B-Instruct-FP8","release_date":"2024-08-29","context_window":131072,"license":"llama3.1","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"openai/gpt-oss-120b","name":"gpt-oss-120b","created_by":"openai","source":"official","last_updated":"2026-03-24","family":"gpt-oss","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true,"structured_output":true,"reasoning":true,"json_mode":true,"vision":false,"batch":true},"model_type":"chat","parameters":120,"page_url":"https://huggingface.co/openai/gpt-oss-120b","description":"Welcome to the gpt-oss series, [OpenAI’s open-weight models](https://openai.com/open-models) designed for powerful reasoning, agentic tasks, and versatile developer use cases.","release_date":"2025-08-04","context_window":131072,"license":"apache-2.0","tagline":"Welcome to the gpt-oss series, [OpenAI’s open-weight 
models](https://openai.com/open-models) designed for powerful reasoning, agentic tasks, and versatile developer use cases.","architecture":"moe","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]},"max_output_tokens":131072,"knowledge_cutoff":"2024-06"},{"id":"openai/gpt-oss-20b","name":"gpt-oss-20b","created_by":"openai","source":"official","last_updated":"2026-03-24","family":"gpt-oss","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true,"structured_output":true,"reasoning":true,"json_mode":true,"vision":false,"batch":true},"model_type":"chat","parameters":22,"page_url":"https://huggingface.co/openai/gpt-oss-20b","description":"Welcome to the gpt-oss series, [OpenAI’s open-weight models](https://openai.com/open-models) designed for powerful reasoning, agentic tasks, and versatile developer use cases.","release_date":"2025-08-04","context_window":131072,"license":"apache-2.0","tagline":"Welcome to the gpt-oss series, [OpenAI’s open-weight models](https://openai.com/open-models) designed for powerful reasoning, agentic tasks, and versatile developer use cases.","architecture":"moe","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]},"max_output_tokens":131072,"knowledge_cutoff":"2024-06"},{"id":"openai/gpt-oss-safeguard-20b","name":"gpt-oss-safeguard-20b","created_by":"openai","source":"official","last_updated":"2026-05-29","family":"gpt-oss","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"model_type":"moderation","parameters":22,"page_url":"https://huggingface.co/openai/gpt-oss-safeguard-20b","description":"`gpt-oss-safeguard-120b` and `gpt-oss-safeguard-20b` are safety reasoning models built-upon gpt-oss. With these models, you can classify text content based on safety policies that you provide and perform a suite of foundational safety tasks. These models are intended for safety use cases. 
For other applications, we recommend using [gpt-oss models](https://huggingface.co/collections/openai/gpt-oss).","release_date":"2025-09-18","context_window":131072,"license":"apache-2.0","tagline":"`gpt-oss-safeguard-120b` and `gpt-oss-safeguard-20b` are safety reasoning models built-upon gpt-oss.","architecture":"moe","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"openchat/openchat-3.6-8b-20240522","name":"openchat-3.6-8b-20240522","created_by":"openchat","source":"official","last_updated":"2026-03-24","alias":"openchat/openchat-3.6-8b","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"parameters":8,"page_url":"https://huggingface.co/openchat/openchat-3.6-8b-20240522","description":"To use this model, we highly recommend installing the OpenChat package by following the [installation guide](https://github.com/imoneoi/openchat#installation) in our repository and using the OpenChat OpenAI-compatible API server by running the serving command from the table below. 
The server is optimized for high-throughput deployment using [vLLM](https://github.com/vllm-project/vllm) and can run on a consumer GPU with 24GB RAM.","release_date":"2024-05-07","context_window":8192,"license":"llama3","tagline":"To use this model, we highly recommend installing the OpenChat package by following the [installation guide](https://github.com/imoneoi/openchat#installation) in our repository and using the OpenChat OpenAI-compatible API server by running the serving command from the table below.","architecture":"transformer","open_weight":true,"tools":["function_calling"]},{"id":"openchat/openchat-3.6-8b","name":"openchat-3.6-8b-20240522","created_by":"openchat","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"snapshots":["openchat/openchat-3.6-8b-20240522"],"parameters":8,"page_url":"https://huggingface.co/openchat/openchat-3.6-8b-20240522","description":"To use this model, we highly recommend installing the OpenChat package by following the [installation guide](https://github.com/imoneoi/openchat#installation) in our repository and using the OpenChat OpenAI-compatible API server by running the serving command from the table below. 
The server is optimized for high-throughput deployment using [vLLM](https://github.com/vllm-project/vllm) and can run on a consumer GPU with 24GB RAM.","release_date":"2024-05-07","context_window":8192,"license":"llama3","tagline":"To use this model, we highly recommend installing the OpenChat package by following the [installation guide](https://github.com/imoneoi/openchat#installation) in our repository and using the OpenChat OpenAI-compatible API server by running the serving command from the table below.","architecture":"transformer","open_weight":true,"tools":["function_calling"]},{"id":"openchat/openchat_3.5","name":"openchat_3.5","created_by":"openchat","source":"official","description":"**🔥 The first 7B model Achieves Comparable Results with ChatGPT (March)! 🔥**","release_date":"2023-10-30","context_window":8192,"license":"apache-2.0","page_url":"https://huggingface.co/openchat/openchat_3.5","architecture":"transformer","tagline":"**🔥 The first 7B model Achieves Comparable Results with ChatGPT (March)! 
🔥**","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"tools":["function_calling"],"last_updated":"2026-05-01"},{"id":"OpenPipe/Qwen3-14B-Instruct","name":"Qwen3-14B-Instruct","created_by":"openpipe","source":"official","release_date":"2025-10-10","context_window":40960,"license":"apache-2.0","parameters":15,"page_url":"https://huggingface.co/OpenPipe/Qwen3-14B-Instruct","architecture":"transformer","model_type":"chat","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-05-01"},{"id":"Orion-zhen/Qwen2.5-7B-Instruct-Uncensored","name":"Qwen2.5-7B-Instruct-Uncensored","created_by":"orion-zhen","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"model_type":"chat","parameters":7.6,"page_url":"https://huggingface.co/Orion-zhen/Qwen2.5-7B-Instruct-Uncensored","description":"This model is an uncensored fine-tune version of Qwen2.5-7B-Instruct. 
However, I can still notice that though uncensored, the model fails to generate detailed descriptions on certain extreme scenarios, which might be associated with deletion on some pretrain datasets in Qwen's pretraining stage.","release_date":"2024-09-26","context_window":32768,"license":"gpl-3.0","tagline":"This model is an uncensored fine-tune version of Qwen2.5-7B-Instruct.","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"PatronusAI/Llama-3-Patronus-Lynx-8B-Instruct-v1.1","name":"Llama-3-Patronus-Lynx-8B-Instruct-v1.1","created_by":"patronusai","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"family":"Llama-3","model_type":"chat","parameters":8,"page_url":"https://huggingface.co/PatronusAI/Llama-3-Patronus-Lynx-8B-Instruct-v1.1","description":"Lynx is an open-source hallucination evaluation model. Patronus-Lynx-8B-Instruct-v1.1 was trained on a mix of datasets including CovidQA, PubmedQA, DROP, RAGTruth. The datasets contain a mix of hand-annotated and synthetic data. The maximum sequence length is 128000 tokens.","release_date":"2024-07-24","context_window":131072,"license":"cc-by-nc-4.0","tagline":"Lynx is an open-source hallucination evaluation model.","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"prefeitura-rio/Rio-3.0-Open-Mini","name":"Rio-3.0-Open-Mini","created_by":"prefeitura-rio","source":"official","description":"**Rio 3.0 Open Mini** is a frontier-class reasoning model developed by [IplanRIO](https://iplanrio.rio.rj.gov.br/), the municipal IT company of Rio de Janeiro's city government. 
Built through distillation on top of Qwen3-4B-Thinking-2507 using reasoning traces from our to be announced Rio 3.0 model, Rio 3.0 Open achieves state-of-the-art results across mathematics, STEM, and code benchmarks — surpassing its base model by significant margins and competing with models far larger than itself.","release_date":"2026-02-09","context_window":262144,"license":"mit","parameters":4,"page_url":"https://huggingface.co/prefeitura-rio/Rio-3.0-Open-Mini","architecture":"transformer","tagline":"**Rio 3.0 Open Mini** is a frontier-class reasoning model developed by [IplanRIO](https://iplanrio.rio.rj.gov.br/), the municipal IT company of Rio de Janeiro's city government.","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"tools":["function_calling"],"last_updated":"2026-05-01"},{"id":"Qwen/Qwen1.5-0.5B-Chat","name":"Qwen1.5-0.5B-Chat","created_by":"qwen","source":"official","release_date":"2024-01-31","context_window":32768,"license":"other","parameters":0.62,"page_url":"https://huggingface.co/Qwen/Qwen1.5-0.5B-Chat","architecture":"transformer","model_type":"chat","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-05-01"},{"id":"Qwen/Qwen1.5-1.8B-Chat","name":"Qwen1.5-1.8B-Chat","created_by":"qwen","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"model_type":"chat","parameters":1.8,"page_url":"https://huggingface.co/Qwen/Qwen1.5-1.8B-Chat","release_date":"2024-01-30","context_window":32768,"license":"other","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"Qwen/Qwen2-0.5B-Instruct","name":"Qwen2-0.5B-Instruct","created_by":"qwen","source":"official","release_date":"2024-06-03","context_window":32768,"license":"apache-2.0","paramete
rs":0.49,"page_url":"https://huggingface.co/Qwen/Qwen2-0.5B-Instruct","architecture":"transformer","model_type":"chat","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-05-01"},{"id":"Qwen/Qwen2-1.5B-Instruct","name":"Qwen2-1.5B-Instruct","created_by":"qwen","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"model_type":"chat","parameters":1.5,"page_url":"https://huggingface.co/Qwen/Qwen2-1.5B-Instruct","release_date":"2024-06-03","context_window":32768,"license":"apache-2.0","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"Qwen/Qwen2-72B-Instruct","name":"Qwen2-72B-Instruct","created_by":"qwen","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"model_type":"chat","parameters":73,"page_url":"https://huggingface.co/Qwen/Qwen2-72B-Instruct","release_date":"2024-05-28","context_window":32768,"license":"other","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]},"description":"Alibaba Cloud's Qwen2 open-source version. 
[Usage](https://www.alibabacloud.com/help/en/document_detail/2841718.html#24e54b27d4agt) \\| [API reference](https://www.alibabacloud.com/help/en/document_detail/2712576.html) \\| [Try online](https://modelstudio.console.alibabacloud.com/?tab=playground#/efm/prompt)","tagline":"The Qwen2 open-source model from Alibaba Cloud.","max_output_tokens":6144},{"id":"Qwen/Qwen2-7B-Instruct","name":"Qwen2-7B-Instruct","created_by":"qwen","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"model_type":"chat","parameters":7.6,"page_url":"https://huggingface.co/Qwen/Qwen2-7B-Instruct","release_date":"2024-06-04","context_window":32768,"license":"apache-2.0","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]},"description":"Alibaba Cloud's Qwen2 open-source version. [Usage](https://www.alibabacloud.com/help/en/document_detail/2841718.html#24e54b27d4agt) \\| [API reference](https://www.alibabacloud.com/help/en/document_detail/2712576.html) \\| [Try online](https://modelstudio.console.alibabacloud.com/?tab=playground#/efm/prompt)","tagline":"The Qwen2 open-source model from Alibaba 
Cloud."},{"id":"Qwen/Qwen2.5-0.5B-Instruct","name":"Qwen2.5-0.5B-Instruct","created_by":"qwen","source":"official","release_date":"2024-09-16","context_window":32768,"license":"apache-2.0","parameters":0.49,"page_url":"https://huggingface.co/Qwen/Qwen2.5-0.5B-Instruct","architecture":"transformer","model_type":"chat","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-05-01"},{"id":"Qwen/Qwen2.5-1.5B-Instruct","name":"Qwen2.5-1.5B-Instruct","created_by":"qwen","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"model_type":"chat","parameters":1.5,"page_url":"https://huggingface.co/Qwen/Qwen2.5-1.5B-Instruct","release_date":"2024-09-17","context_window":32768,"license":"apache-2.0","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"Qwen/Qwen2.5-14B-Instruct-1M","name":"Qwen2.5-14B-Instruct-1M","created_by":"qwen","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true,"reasoning":true,"structured_output":true,"batch":true,"json_mode":true},"model_type":"chat","parameters":15,"page_url":"https://huggingface.co/Qwen/Qwen2.5-14B-Instruct-1M","release_date":"2025-01-23","context_window":1010000,"license":"apache-2.0","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]},"description":"Qwen2.5 is part of the Qwen Large Language Model (LLM) series. We released a series of base language models and instruction-tuned language models with parameter scales ranging from 7 billion to 72 billion. Qwen2.5 improves upon Qwen2 in the following ways: * Pre-trained on our latest large-scale dataset containing up to 18 trillion tokens. 
* Significantly expanded knowledge and greatly enhanced coding and math capabilities due to our domain-expert models. * Major improvements in instruction following, long-text generation (over 8K tokens), structured data understanding (such as tables), and structured output generation (especially JSON). More resilient to diverse system prompts, enhancing chatbot role-playing and conditional setup. * Supports over 29 languages, including Chinese, English, French, Spanish, Portuguese, German, Italian, Russian, Japanese, Korean, Vietnamese, Thai, and Arabic. [Usage](https://www.alibabacloud.com/help/en/document_detail/2841718.html#24e54b27d4agt) \\| [API reference](https://www.alibabacloud.com/help/en/document_detail/2712576.html) \\| [Try online](https://modelstudio.console.alibabacloud.com/?tab=playground#/efm/prompt) ## International If you select the [International](https://www.alibabacloud.com/help/en/document_detail/3004398.html#080da663a75xh) deployment scope, model inference compute resources are dynamically scheduled worldwide, excluding the Chinese mainland. Static data is stored in your selected region. Supported region: Singapore.","tagline":"Qwen2.5 is a large language model series from Qwen.","max_output_tokens":8192},{"id":"Qwen/Qwen2.5-14B-Instruct","name":"Qwen2.5-14B-Instruct","created_by":"qwen","source":"official","last_updated":"2026-05-23","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true,"reasoning":true,"structured_output":true,"batch":true,"json_mode":true},"model_type":"chat","parameters":15,"page_url":"https://huggingface.co/Qwen/Qwen2.5-14B-Instruct","release_date":"2024-09-16","context_window":32768,"license":"apache-2.0","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]},"description":"Qwen2.5 is part of the Qwen Large Language Model (LLM) series. 
We released a series of base language models and instruction-tuned language models with parameter scales ranging from 7 billion to 72 billion. Qwen2.5 improves upon Qwen2 in the following ways: * Pre-trained on our latest large-scale dataset containing up to 18 trillion tokens. * Significantly expanded knowledge and greatly enhanced coding and math capabilities due to our domain-expert models. * Major improvements in instruction following, long-text generation (over 8K tokens), structured data understanding (such as tables), and structured output generation (especially JSON). More resilient to diverse system prompts, enhancing chatbot role-playing and conditional setup. * Supports over 29 languages, including Chinese, English, French, Spanish, Portuguese, German, Italian, Russian, Japanese, Korean, Vietnamese, Thai, and Arabic. [Usage](https://www.alibabacloud.com/help/en/document_detail/2841718.html#24e54b27d4agt) \\| [API reference](https://www.alibabacloud.com/help/en/document_detail/2712576.html) \\| [Try online](https://modelstudio.console.alibabacloud.com/?tab=playground#/efm/prompt) ## International If you select the [International](https://www.alibabacloud.com/help/en/document_detail/3004398.html#080da663a75xh) deployment scope, model inference compute resources are dynamically scheduled worldwide, excluding the Chinese mainland. Static data is stored in your selected region. 
Supported region: Singapore.","tagline":"Qwen2.5 is a large language model series from Qwen."},{"id":"Qwen/Qwen2.5-32B-Instruct","name":"Qwen2.5-32B-Instruct","created_by":"qwen","source":"official","last_updated":"2026-05-23","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true,"reasoning":true,"structured_output":true,"batch":true,"json_mode":true},"model_type":"chat","parameters":33,"page_url":"https://huggingface.co/Qwen/Qwen2.5-32B-Instruct","release_date":"2024-09-17","context_window":32768,"license":"apache-2.0","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]},"description":"Qwen2.5 is part of the Qwen Large Language Model (LLM) series. We released a series of base language models and instruction-tuned language models with parameter scales ranging from 7 billion to 72 billion. Qwen2.5 improves upon Qwen2 in the following ways: * Pre-trained on our latest large-scale dataset containing up to 18 trillion tokens. * Significantly expanded knowledge and greatly enhanced coding and math capabilities due to our domain-expert models. * Major improvements in instruction following, long-text generation (over 8K tokens), structured data understanding (such as tables), and structured output generation (especially JSON). More resilient to diverse system prompts, enhancing chatbot role-playing and conditional setup. * Supports over 29 languages, including Chinese, English, French, Spanish, Portuguese, German, Italian, Russian, Japanese, Korean, Vietnamese, Thai, and Arabic. 
[Usage](https://www.alibabacloud.com/help/en/document_detail/2841718.html#24e54b27d4agt) \\| [API reference](https://www.alibabacloud.com/help/en/document_detail/2712576.html) \\| [Try online](https://modelstudio.console.alibabacloud.com/?tab=playground#/efm/prompt) ## International If you select the [International](https://www.alibabacloud.com/help/en/document_detail/3004398.html#080da663a75xh) deployment scope, model inference compute resources are dynamically scheduled worldwide, excluding the Chinese mainland. Static data is stored in your selected region. Supported region: Singapore.","tagline":"Qwen2.5 is a large language model series from Qwen."},{"id":"Qwen/Qwen2.5-3B-Instruct","name":"Qwen2.5-3B-Instruct","created_by":"qwen","source":"official","release_date":"2024-09-17","context_window":32768,"license":"other","parameters":3.1,"page_url":"https://huggingface.co/Qwen/Qwen2.5-3B-Instruct","architecture":"transformer","model_type":"chat","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-05-01"},{"id":"Qwen/Qwen2.5-72B-Instruct","name":"Qwen2.5-72B-Instruct","created_by":"qwen","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true,"reasoning":true,"structured_output":true,"batch":true,"json_mode":true},"model_type":"chat","parameters":73,"page_url":"https://huggingface.co/Qwen/Qwen2.5-72B-Instruct","release_date":"2024-09-16","context_window":32768,"license":"other","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]},"description":"Qwen2.5 is part of the Qwen Large Language Model (LLM) series. We released a series of base language models and instruction-tuned language models with parameter scales ranging from 7 billion to 72 billion. 
Qwen2.5 improves upon Qwen2 in the following ways: * Pre-trained on our latest large-scale dataset containing up to 18 trillion tokens. * Significantly expanded knowledge and greatly enhanced coding and math capabilities due to our domain-expert models. * Major improvements in instruction following, long-text generation (over 8K tokens), structured data understanding (such as tables), and structured output generation (especially JSON). More resilient to diverse system prompts, enhancing chatbot role-playing and conditional setup. * Supports over 29 languages, including Chinese, English, French, Spanish, Portuguese, German, Italian, Russian, Japanese, Korean, Vietnamese, Thai, and Arabic. [Usage](https://www.alibabacloud.com/help/en/document_detail/2841718.html#24e54b27d4agt) \\| [API reference](https://www.alibabacloud.com/help/en/document_detail/2712576.html) \\| [Try online](https://modelstudio.console.alibabacloud.com/?tab=playground#/efm/prompt) ## International If you select the [International](https://www.alibabacloud.com/help/en/document_detail/3004398.html#080da663a75xh) deployment scope, model inference compute resources are dynamically scheduled worldwide, excluding the Chinese mainland. Static data is stored in your selected region. 
Supported region: Singapore.","tagline":"Qwen2.5 is a large language model series from Qwen."},{"id":"Qwen/Qwen2.5-7B-Instruct-1M","name":"Qwen2.5-7B-Instruct-1M","created_by":"qwen","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true,"reasoning":true,"structured_output":true,"batch":true,"json_mode":true},"model_type":"chat","parameters":7.6,"page_url":"https://huggingface.co/Qwen/Qwen2.5-7B-Instruct-1M","release_date":"2025-01-23","context_window":1010000,"license":"apache-2.0","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]},"description":"Qwen2.5 is part of the Qwen Large Language Model (LLM) series. We released a series of base language models and instruction-tuned language models with parameter scales ranging from 7 billion to 72 billion. Qwen2.5 improves upon Qwen2 in the following ways: * Pre-trained on our latest large-scale dataset containing up to 18 trillion tokens. * Significantly expanded knowledge and greatly enhanced coding and math capabilities due to our domain-expert models. * Major improvements in instruction following, long-text generation (over 8K tokens), structured data understanding (such as tables), and structured output generation (especially JSON). More resilient to diverse system prompts, enhancing chatbot role-playing and conditional setup. * Supports over 29 languages, including Chinese, English, French, Spanish, Portuguese, German, Italian, Russian, Japanese, Korean, Vietnamese, Thai, and Arabic. 
[Usage](https://www.alibabacloud.com/help/en/document_detail/2841718.html#24e54b27d4agt) \\| [API reference](https://www.alibabacloud.com/help/en/document_detail/2712576.html) \\| [Try online](https://modelstudio.console.alibabacloud.com/?tab=playground#/efm/prompt) ## International If you select the [International](https://www.alibabacloud.com/help/en/document_detail/3004398.html#080da663a75xh) deployment scope, model inference compute resources are dynamically scheduled worldwide, excluding the Chinese mainland. Static data is stored in your selected region. Supported region: Singapore.","tagline":"Qwen2.5 is a large language model series from Qwen."},{"id":"Qwen/Qwen2.5-7B-Instruct","name":"Qwen2.5-7B-Instruct","created_by":"qwen","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true,"reasoning":true,"structured_output":true,"batch":true,"json_mode":true},"model_type":"chat","parameters":7.6,"page_url":"https://huggingface.co/Qwen/Qwen2.5-7B-Instruct","release_date":"2024-09-16","context_window":32768,"license":"apache-2.0","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]},"description":"Qwen2.5 is part of the Qwen Large Language Model (LLM) series. We released a series of base language models and instruction-tuned language models with parameter scales ranging from 7 billion to 72 billion. Qwen2.5 improves upon Qwen2 in the following ways: * Pre-trained on our latest large-scale dataset containing up to 18 trillion tokens. * Significantly expanded knowledge and greatly enhanced coding and math capabilities due to our domain-expert models. * Major improvements in instruction following, long-text generation (over 8K tokens), structured data understanding (such as tables), and structured output generation (especially JSON). More resilient to diverse system prompts, enhancing chatbot role-playing and conditional setup. 
* Supports over 29 languages, including Chinese, English, French, Spanish, Portuguese, German, Italian, Russian, Japanese, Korean, Vietnamese, Thai, and Arabic. [Usage](https://www.alibabacloud.com/help/en/document_detail/2841718.html#24e54b27d4agt) \\| [API reference](https://www.alibabacloud.com/help/en/document_detail/2712576.html) \\| [Try online](https://modelstudio.console.alibabacloud.com/?tab=playground#/efm/prompt) ## International If you select the [International](https://www.alibabacloud.com/help/en/document_detail/3004398.html#080da663a75xh) deployment scope, model inference compute resources are dynamically scheduled worldwide, excluding the Chinese mainland. Static data is stored in your selected region. Supported region: Singapore.","tagline":"Qwen2.5 is a large language model series from Qwen."},{"id":"Qwen/Qwen2.5-Coder-0.5B-Instruct","name":"Qwen2.5-Coder-0.5B-Instruct","created_by":"qwen","source":"official","release_date":"2024-11-06","context_window":32768,"license":"apache-2.0","parameters":0.49,"page_url":"https://huggingface.co/Qwen/Qwen2.5-Coder-0.5B-Instruct","architecture":"transformer","model_type":"code","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-05-01"},{"id":"Qwen/Qwen2.5-Coder-0.5B","name":"Qwen2.5-Coder-0.5B","created_by":"qwen","source":"official","release_date":"2024-11-08","context_window":32768,"license":"apache-2.0","parameters":0.49,"page_url":"https://huggingface.co/Qwen/Qwen2.5-Coder-0.5B","architecture":"transformer","model_type":"code","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-05-01"},{"id":"Qwen/Qwen2.5-Coder-1.5B-Instruct","name":"Qwen2.5-Coder-1.5B-Instruct","created_by":"qwen","source":"official","last_updated":"2026-03-24","capabil
ities":{"streaming":true,"tool_call":true,"fine_tuning":true},"model_type":"code","parameters":1.5,"page_url":"https://huggingface.co/Qwen/Qwen2.5-Coder-1.5B-Instruct","release_date":"2024-09-18","context_window":32768,"license":"apache-2.0","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"Qwen/Qwen2.5-Coder-1.5B","name":"Qwen2.5-Coder-1.5B","created_by":"qwen","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"model_type":"code","parameters":1.5,"page_url":"https://huggingface.co/Qwen/Qwen2.5-Coder-1.5B","release_date":"2024-09-18","context_window":32768,"license":"apache-2.0","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"Qwen/Qwen2.5-Coder-14B-Instruct","name":"Qwen2.5-Coder-14B-Instruct","created_by":"qwen","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"model_type":"code","parameters":15,"page_url":"https://huggingface.co/Qwen/Qwen2.5-Coder-14B-Instruct","release_date":"2024-11-06","context_window":32768,"license":"apache-2.0","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"Qwen/Qwen2.5-Coder-14B","name":"Qwen2.5-Coder-14B","created_by":"qwen","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"model_type":"code","parameters":15,"page_url":"https://huggingface.co/Qwen/Qwen2.5-Coder-14B","release_date":"2024-11-08","context_window":32768,"license":"apache-2.0","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"Qwen/Qwen2.5-Coder-32B-Instruct","name":"Qwen2.5-Coder-32B-Instruct","created_by":"qwen","source":"official","las
t_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"model_type":"code","parameters":33,"page_url":"https://huggingface.co/Qwen/Qwen2.5-Coder-32B-Instruct","release_date":"2024-11-06","context_window":32768,"license":"apache-2.0","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"Qwen/Qwen2.5-Coder-32B","name":"Qwen2.5-Coder-32B","created_by":"qwen","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"model_type":"code","parameters":33,"page_url":"https://huggingface.co/Qwen/Qwen2.5-Coder-32B","release_date":"2024-11-08","context_window":32768,"license":"apache-2.0","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"Qwen/Qwen2.5-Coder-3B-Instruct","name":"Qwen2.5-Coder-3B-Instruct","created_by":"qwen","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"model_type":"code","parameters":3.1,"page_url":"https://huggingface.co/Qwen/Qwen2.5-Coder-3B-Instruct","release_date":"2024-11-06","context_window":32768,"license":"other","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"Qwen/Qwen2.5-Coder-3B","name":"Qwen2.5-Coder-3B","created_by":"qwen","source":"official","release_date":"2024-11-08","context_window":32768,"license":"other","parameters":3.1,"page_url":"https://huggingface.co/Qwen/Qwen2.5-Coder-3B","architecture":"transformer","model_type":"code","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-05-01"},{"id":"Qwen/Qwen2.5-Coder-7B-Instruct","name":"Qwen2.5-Coder-7B-Instruct","created_by":"qwen","source":"offi
cial","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"model_type":"code","parameters":7.6,"page_url":"https://huggingface.co/Qwen/Qwen2.5-Coder-7B-Instruct","release_date":"2024-09-17","context_window":32768,"license":"apache-2.0","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"Qwen/Qwen2.5-Coder-7B","name":"Qwen2.5-Coder-7B","created_by":"qwen","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"model_type":"code","parameters":7.6,"page_url":"https://huggingface.co/Qwen/Qwen2.5-Coder-7B","release_date":"2024-09-16","context_window":32768,"license":"apache-2.0","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"Qwen/Qwen2.5-Math-1.5B-Instruct","name":"Qwen2.5-Math-1.5B-Instruct","created_by":"qwen","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"model_type":"chat","parameters":1.5,"page_url":"https://huggingface.co/Qwen/Qwen2.5-Math-1.5B-Instruct","description":"> [!Warning] >
> > 🚨 Qwen2.5-Math mainly supports solving English and Chinese math problems through CoT and TIR. We do not recommend using this series of models for other tasks. > >
","release_date":"2024-09-16","context_window":4096,"license":"apache-2.0","tagline":"> [!Warning] >
> > 🚨 Qwen2.5-Math mainly supports solving English and Chinese math problems through CoT and TIR.","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"Qwen/Qwen2.5-Math-7B-Instruct","name":"Qwen2.5-Math-7B-Instruct","created_by":"qwen","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"model_type":"chat","parameters":7.6,"page_url":"https://huggingface.co/Qwen/Qwen2.5-Math-7B-Instruct","description":"> [!Warning] >
> > 🚨 Qwen2.5-Math mainly supports solving English and Chinese math problems through CoT and TIR. We do not recommend using this series of models for other tasks. > >
","release_date":"2024-09-19","context_window":4096,"license":"apache-2.0","tagline":"> [!Warning] >
> > 🚨 Qwen2.5-Math mainly supports solving English and Chinese math problems through CoT and TIR.","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"Qwen/Qwen3-0.6B-Base","name":"Qwen3-0.6B-Base","created_by":"qwen","source":"official","release_date":"2025-04-28","context_window":32768,"license":"apache-2.0","page_url":"https://huggingface.co/Qwen/Qwen3-0.6B-Base","architecture":"transformer","model_type":"chat","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-05-23","parameters":0.6},{"id":"Qwen/Qwen3-0.6B","name":"Qwen3-0.6B","created_by":"qwen","source":"official","release_date":"2025-04-27","context_window":40960,"license":"apache-2.0","parameters":0.75,"page_url":"https://huggingface.co/Qwen/Qwen3-0.6B","architecture":"transformer","model_type":"chat","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true,"reasoning":true,"structured_output":true,"batch":true,"json_mode":true},"open_weight":true,"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-05-01"},{"id":"Qwen/Qwen3-1.7B-Base","name":"Qwen3-1.7B-Base","created_by":"qwen","source":"official","release_date":"2025-04-28","context_window":32768,"license":"apache-2.0","parameters":1.7,"page_url":"https://huggingface.co/Qwen/Qwen3-1.7B-Base","architecture":"transformer","model_type":"chat","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-05-01"},{"id":"Qwen/Qwen3-1.7B","name":"Qwen3-1.7B","created_by":"qwen","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true,"reasoning":true,"structured_output":true,"batch":true,"json_mode":tru
e},"model_type":"chat","parameters":2,"page_url":"https://huggingface.co/Qwen/Qwen3-1.7B","release_date":"2025-04-27","context_window":40960,"license":"apache-2.0","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"Qwen/Qwen3-14B-Base","name":"Qwen3-14B-Base","created_by":"qwen","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"model_type":"chat","parameters":15,"page_url":"https://huggingface.co/Qwen/Qwen3-14B-Base","release_date":"2025-04-28","context_window":32768,"license":"apache-2.0","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"Qwen/Qwen3-14B","name":"Qwen3-14B","created_by":"qwen","source":"official","last_updated":"2026-05-23","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true,"reasoning":true,"structured_output":true,"batch":true,"json_mode":true},"model_type":"chat","parameters":15,"page_url":"https://huggingface.co/Qwen/Qwen3-14B","release_date":"2025-04-27","context_window":40960,"license":"apache-2.0","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"Qwen/Qwen3-235B-A22B-Instruct-2507","name":"Qwen3-235B-A22B-Instruct-2507","created_by":"qwen","source":"official","last_updated":"2026-05-23","alias":"Qwen/Qwen3-235B-A22B-Instruct","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true,"reasoning":true,"structured_output":true,"batch":true,"json_mode":true},"model_type":"chat","parameters":235,"active_parameters":15,"page_url":"https://huggingface.co/Qwen/Qwen3-235B-A22B-Instruct-2507","release_date":"2025-07-21","context_window":262144,"license":"apache-2.0","architecture":"moe","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"Qwen/Qwen3-235B-A2
2B-Instruct","name":"Qwen3-235B-A22B-Instruct-2507","created_by":"qwen","source":"official","last_updated":"2026-05-23","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true,"reasoning":true,"structured_output":true,"batch":true,"json_mode":true},"snapshots":["Qwen/Qwen3-235B-A22B-Instruct-2507"],"model_type":"chat","parameters":235,"active_parameters":15,"page_url":"https://huggingface.co/Qwen/Qwen3-235B-A22B-Instruct-2507","release_date":"2025-07-21","context_window":262144,"license":"apache-2.0","architecture":"moe","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"Qwen/Qwen3-235B-A22B-Thinking-2507","name":"Qwen3-235B-A22B-Thinking-2507","created_by":"qwen","source":"official","last_updated":"2026-05-23","alias":"Qwen/Qwen3-235B-A22B-Thinking","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true,"reasoning":true,"structured_output":true,"batch":true,"json_mode":true},"model_type":"chat","parameters":235,"active_parameters":15,"page_url":"https://huggingface.co/Qwen/Qwen3-235B-A22B-Thinking-2507","release_date":"2025-07-25","context_window":262144,"license":"apache-2.0","architecture":"moe","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"Qwen/Qwen3-235B-A22B-Thinking","name":"Qwen3-235B-A22B-Thinking-2507","created_by":"qwen","source":"official","last_updated":"2026-05-23","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true,"reasoning":true,"structured_output":true,"batch":true,"json_mode":true},"snapshots":["Qwen/Qwen3-235B-A22B-Thinking-2507"],"model_type":"chat","parameters":235,"active_parameters":15,"page_url":"https://huggingface.co/Qwen/Qwen3-235B-A22B-Thinking-2507","release_date":"2025-07-25","context_window":262144,"license":"apache-2.0","architecture":"moe","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"Qwen/Qwen3-235B-A22B","name":"Qw
en3-235B-A22B","created_by":"qwen","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true,"reasoning":true,"structured_output":true,"batch":true,"json_mode":true},"model_type":"chat","parameters":235,"active_parameters":15,"page_url":"https://huggingface.co/Qwen/Qwen3-235B-A22B","release_date":"2025-04-27","context_window":40960,"license":"apache-2.0","architecture":"moe","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"Qwen/Qwen3-30B-A3B-Instruct-2507","name":"Qwen3-30B-A3B-Instruct-2507","created_by":"qwen","source":"official","last_updated":"2026-05-23","alias":"Qwen/Qwen3-30B-A3B-Instruct","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true,"reasoning":true,"structured_output":true,"batch":true,"json_mode":true},"model_type":"chat","parameters":31,"active_parameters":1.9,"page_url":"https://huggingface.co/Qwen/Qwen3-30B-A3B-Instruct-2507","release_date":"2025-07-28","context_window":262144,"license":"apache-2.0","architecture":"moe","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"Qwen/Qwen3-30B-A3B-Instruct","name":"Qwen3-30B-A3B-Instruct-2507","created_by":"qwen","source":"official","last_updated":"2026-05-23","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true,"reasoning":true,"structured_output":true,"batch":true,"json_mode":true},"snapshots":["Qwen/Qwen3-30B-A3B-Instruct-2507"],"model_type":"chat","parameters":31,"active_parameters":1.9,"page_url":"https://huggingface.co/Qwen/Qwen3-30B-A3B-Instruct-2507","release_date":"2025-07-28","context_window":262144,"license":"apache-2.0","architecture":"moe","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"Qwen/Qwen3-30B-A3B-Thinking-2507","name":"Qwen3-30B-A3B-Thinking-2507","created_by":"qwen","source":"official","last_updated":"2026-03-24","release_dat
e":"2025-07-29","context_window":262144,"model_type":"chat","license":"apache-2.0","parameters":31,"active_parameters":1.9,"alias":"Qwen/Qwen3-30B-A3B-Thinking","page_url":"https://huggingface.co/Qwen/Qwen3-30B-A3B-Thinking-2507","architecture":"moe","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true,"reasoning":true,"structured_output":true,"batch":true,"json_mode":true},"modalities":{"input":["text"],"output":["text"]},"open_weight":true,"tools":["function_calling"]},{"id":"Qwen/Qwen3-30B-A3B-Thinking","name":"Qwen3-30B-A3B-Thinking-2507","created_by":"qwen","source":"official","last_updated":"2026-03-24","release_date":"2025-07-29","context_window":262144,"license":"apache-2.0","parameters":31,"active_parameters":1.9,"page_url":"https://huggingface.co/Qwen/Qwen3-30B-A3B-Thinking-2507","architecture":"moe","model_type":"chat","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true,"reasoning":true,"structured_output":true,"batch":true,"json_mode":true},"open_weight":true,"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"snapshots":["Qwen/Qwen3-30B-A3B-Thinking-2507"]},{"id":"Qwen/Qwen3-30B-A3B","name":"Qwen3-30B-A3B","created_by":"qwen","source":"official","last_updated":"2026-05-23","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true,"reasoning":true,"structured_output":true,"batch":true,"json_mode":true},"model_type":"chat","parameters":31,"active_parameters":1.9,"page_url":"https://huggingface.co/Qwen/Qwen3-30B-A3B","release_date":"2025-04-27","context_window":40960,"license":"apache-2.0","architecture":"moe","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"Qwen/Qwen3-32B","name":"Qwen3-32B","created_by":"qwen","source":"official","last_updated":"2026-05-23","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true,"reasoning":true,"structured_output":true,"batch":true,"json_mode":true},"model_type":"chat","parameters
":33,"page_url":"https://huggingface.co/Qwen/Qwen3-32B","release_date":"2025-04-27","context_window":40960,"license":"apache-2.0","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"Qwen/Qwen3-4B-Base","name":"Qwen3-4B-Base","created_by":"qwen","source":"official","release_date":"2025-04-28","context_window":32768,"license":"apache-2.0","parameters":4,"page_url":"https://huggingface.co/Qwen/Qwen3-4B-Base","architecture":"transformer","model_type":"chat","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-05-01"},{"id":"Qwen/Qwen3-4B-Instruct-2507","name":"Qwen3-4B-Instruct-2507","created_by":"qwen","source":"official","last_updated":"2026-03-24","alias":"Qwen/Qwen3-4B-Instruct","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"model_type":"chat","parameters":4,"page_url":"https://huggingface.co/Qwen/Qwen3-4B-Instruct-2507","release_date":"2025-08-05","context_window":262144,"license":"apache-2.0","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"Qwen/Qwen3-4B-Instruct","name":"Qwen3-4B-Instruct-2507","created_by":"qwen","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"snapshots":["Qwen/Qwen3-4B-Instruct-2507"],"model_type":"chat","parameters":4,"page_url":"https://huggingface.co/Qwen/Qwen3-4B-Instruct-2507","release_date":"2025-08-05","context_window":262144,"license":"apache-2.0","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"Qwen/Qwen3-4B-SafeRL","name":"Qwen3-4B-SafeRL","created_by":"qwen","source":"official","release_date":"2025-09-30","context_window":40960,"license":"apache-2.0","param
eters":4.4,"page_url":"https://huggingface.co/Qwen/Qwen3-4B-SafeRL","architecture":"transformer","model_type":"chat","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-05-01"},{"id":"Qwen/Qwen3-4B-Thinking-2507","name":"Qwen3-4B-Thinking-2507","created_by":"qwen","source":"official","last_updated":"2026-03-24","alias":"Qwen/Qwen3-4B-Thinking","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"model_type":"chat","parameters":4,"page_url":"https://huggingface.co/Qwen/Qwen3-4B-Thinking-2507","release_date":"2025-08-05","context_window":262144,"license":"apache-2.0","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"Qwen/Qwen3-4B-Thinking","name":"Qwen3-4B-Thinking-2507","created_by":"qwen","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"snapshots":["Qwen/Qwen3-4B-Thinking-2507"],"model_type":"chat","parameters":4,"page_url":"https://huggingface.co/Qwen/Qwen3-4B-Thinking-2507","release_date":"2025-08-05","context_window":262144,"license":"apache-2.0","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"Qwen/Qwen3-4B","name":"Qwen3-4B","created_by":"qwen","source":"official","release_date":"2025-04-27","context_window":40960,"license":"apache-2.0","page_url":"https://huggingface.co/Qwen/Qwen3-4B","architecture":"transformer","model_type":"chat","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true,"reasoning":true,"structured_output":true,"batch":true,"json_mode":true},"open_weight":true,"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-05-23","parameters":4},{"id":"Qwen/Qwen3-8B-Base","name":"Qwen3-8B-Base","created_by
":"qwen","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"model_type":"chat","parameters":8.2,"page_url":"https://huggingface.co/Qwen/Qwen3-8B-Base","release_date":"2025-04-28","context_window":32768,"license":"apache-2.0","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"Qwen/Qwen3-8B","name":"Qwen3-8B","created_by":"qwen","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true,"reasoning":true,"structured_output":true,"batch":true,"json_mode":true},"model_type":"chat","parameters":8.2,"page_url":"https://huggingface.co/Qwen/Qwen3-8B","release_date":"2025-04-27","context_window":40960,"license":"apache-2.0","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"Qwen/Qwen3-Coder-30B-A3B-Instruct","name":"Qwen3-Coder-30B-A3B-Instruct","created_by":"qwen","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true,"reasoning":true,"structured_output":true,"batch":true,"json_mode":true},"model_type":"code","parameters":31,"active_parameters":1.9,"page_url":"https://huggingface.co/Qwen/Qwen3-Coder-30B-A3B-Instruct","release_date":"2025-07-31","context_window":262144,"license":"apache-2.0","architecture":"moe","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8","name":"Qwen3-Coder-480B-A35B-Instruct-FP8","created_by":"qwen","source":"official","last_updated":"2026-05-23","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"model_type":"code","parameters":480,"active_parameters":24,"release_date":"2025-07-22","context_window":262144,"license":"apache-2.0","page_url":"https://huggingface.co/Qwen/Qwen3-Coder-480B-A35
B-Instruct-FP8","architecture":"moe","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"Qwen/Qwen3-Coder-480B-A35B-Instruct","name":"Qwen3-Coder-480B-A35B-Instruct","created_by":"qwen","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true,"reasoning":true,"structured_output":true,"batch":true,"json_mode":true},"model_type":"code","parameters":480,"active_parameters":24,"page_url":"https://huggingface.co/Qwen/Qwen3-Coder-480B-A35B-Instruct","release_date":"2025-07-22","context_window":262144,"license":"apache-2.0","architecture":"moe","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"Qwen/Qwen3-Coder-Next-FP8","name":"Qwen3-Coder-Next-FP8","created_by":"qwen","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"model_type":"code","page_url":"https://huggingface.co/Qwen/Qwen3-Coder-Next-FP8","release_date":"2026-02-01","context_window":262144,"license":"apache-2.0","parameters":80,"active_parameters":1.6,"architecture":"moe","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"Qwen/Qwen3-Coder-Next","name":"Qwen3-Coder-Next","created_by":"qwen","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true,"reasoning":true,"structured_output":true,"batch":true,"json_mode":true},"model_type":"code","release_date":"2026-01-30","context_window":262144,"license":"apache-2.0","parameters":80,"active_parameters":1.6,"page_url":"https://huggingface.co/Qwen/Qwen3-Coder-Next","architecture":"moe","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]},"description":"An open-source code model from Qwen. The latest Qwen3-Coder series delivers strong Coding Agent capabilities. 
It excels at tool calling and environment interaction. It supports autonomous programming and delivers outstanding coding performance while maintaining broad general-purpose abilities.[How to use](https://www.alibabacloud.com/help/en/document_detail/2850166.html) \\| [API reference](https://www.alibabacloud.com/help/en/document_detail/2712576.html) #### International If you select the [International](https://www.alibabacloud.com/help/en/document_detail/3004398.html#080da663a75xh) deployment scope, model inference compute resources are dynamically scheduled worldwide, excluding the Chinese mainland. Static data is stored in your selected region. Supported region: Singapore.","tagline":"The open-source Qwen code model.","max_output_tokens":65536},{"id":"Qwen/Qwen3-Next-80B-A3B-Instruct","name":"Qwen3-Next-80B-A3B-Instruct","created_by":"qwen","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true,"reasoning":true,"structured_output":true,"batch":true,"json_mode":true},"model_type":"chat","parameters":81,"active_parameters":1.6,"page_url":"https://huggingface.co/Qwen/Qwen3-Next-80B-A3B-Instruct","description":"Over the past few months, we have observed increasingly clear trends toward scaling both total parameters and context lengths in the pursuit of more powerful and agentic artificial intelligence (AI). We are excited to share our latest advancements in addressing these demands, centered on improving scaling efficiency through innovative model architecture. 
We call this next-generation foundation models **Qwen3-Next**.","release_date":"2025-09-09","context_window":262144,"license":"apache-2.0","tagline":"Over the past few months, we have observed increasingly clear trends toward scaling both total parameters and context lengths in the pursuit of more powerful and agentic artificial intelligence (AI).","architecture":"moe","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"Qwen/Qwen3-Next-80B-A3B-Thinking","name":"Qwen3-Next-80B-A3B-Thinking","created_by":"qwen","source":"official","last_updated":"2026-05-23","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true,"reasoning":true,"structured_output":true,"batch":true,"json_mode":true},"model_type":"chat","parameters":81,"active_parameters":1.6,"page_url":"https://huggingface.co/Qwen/Qwen3-Next-80B-A3B-Thinking","description":"Over the past few months, we have observed increasingly clear trends toward scaling both total parameters and context lengths in the pursuit of more powerful and agentic artificial intelligence (AI). We are excited to share our latest advancements in addressing these demands, centered on improving scaling efficiency through innovative model architecture. 
We call this next-generation foundation models **Qwen3-Next**.","release_date":"2025-09-09","context_window":262144,"license":"apache-2.0","tagline":"Over the past few months, we have observed increasingly clear trends toward scaling both total parameters and context lengths in the pursuit of more powerful and agentic artificial intelligence (AI).","architecture":"moe","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"Qwen/Qwen3Guard-Gen-0.6B","name":"Qwen3Guard-Gen-0.6B","created_by":"qwen","source":"official","description":"**Qwen3Guard** is a series of safety moderation models built upon Qwen3 and trained on a dataset of 1.19 million prompts and responses labeled for safety. The series includes models of three sizes (0.6B, 4B, and 8B) and features two specialized variants: **Qwen3Guard-Gen**, a generative model that frames safety classification as an instruction-following task, and **Qwen3Guard-Stream**, which incorporates a token-level classification head for real-time safety monitoring during incremental text ge…","release_date":"2025-09-23","context_window":32768,"license":"apache-2.0","parameters":0.75,"page_url":"https://huggingface.co/Qwen/Qwen3Guard-Gen-0.6B","architecture":"transformer","model_type":"chat","tagline":"**Qwen3Guard** is a series of safety moderation models built upon Qwen3 and trained on a dataset of 1.19 million prompts and responses labeled for safety.","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-05-01"},{"id":"Qwen/Qwen3Guard-Gen-4B","name":"Qwen3Guard-Gen-4B","created_by":"qwen","source":"official","description":"**Qwen3Guard** is a series of safety moderation models built upon Qwen3 and trained on a dataset of 1.19 million prompts and responses labeled for safety. 
The series includes models of three sizes (0.6B, 4B, and 8B) and features two specialized variants: **Qwen3Guard-Gen**, a generative model that frames safety classification as an instruction-following task, and **Qwen3Guard-Stream**, which incorporates a token-level classification head for real-time safety monitoring during incremental text ge…","release_date":"2025-09-23","context_window":32768,"license":"apache-2.0","parameters":4.4,"page_url":"https://huggingface.co/Qwen/Qwen3Guard-Gen-4B","architecture":"transformer","model_type":"chat","tagline":"**Qwen3Guard** is a series of safety moderation models built upon Qwen3 and trained on a dataset of 1.19 million prompts and responses labeled for safety.","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-05-17"},{"id":"Qwen/Qwen3Guard-Gen-8B","name":"Qwen3Guard-Gen-8B","created_by":"qwen","source":"official","description":"**Qwen3Guard** is a series of safety moderation models built upon Qwen3 and trained on a dataset of 1.19 million prompts and responses labeled for safety. 
The series includes models of three sizes (0.6B, 4B, and 8B) and features two specialized variants: **Qwen3Guard-Gen**, a generative model that frames safety classification as an instruction-following task, and **Qwen3Guard-Stream**, which incorporates a token-level classification head for real-time safety monitoring during incremental text ge…","release_date":"2025-09-23","context_window":32768,"license":"apache-2.0","parameters":8.2,"page_url":"https://huggingface.co/Qwen/Qwen3Guard-Gen-8B","architecture":"transformer","model_type":"chat","tagline":"**Qwen3Guard** is a series of safety moderation models built upon Qwen3 and trained on a dataset of 1.19 million prompts and responses labeled for safety.","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-05-01"},{"id":"RedHatAI/Meta-Llama-3-8B-Instruct-FP8-KV","name":"Meta-Llama-3-8B-Instruct-FP8-KV","created_by":"redhatai","source":"official","last_updated":"2026-03-23","capabilities":{"streaming":true,"tool_call":true},"family":"Llama-3","model_type":"chat","parameters":8,"page_url":"https://huggingface.co/RedHatAI/Meta-Llama-3-8B-Instruct-FP8-KV","release_date":"2024-05-20","context_window":8192,"architecture":"transformer","tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"RedHatAI/Qwen2-1.5B-Instruct-FP8","name":"Qwen2-1.5B-Instruct-FP8","created_by":"redhatai","source":"official","release_date":"2024-06-14","context_window":32768,"license":"apache-2.0","parameters":1.5,"page_url":"https://huggingface.co/RedHatAI/Qwen2-1.5B-Instruct-FP8","architecture":"transformer","model_type":"chat","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-05-29"},{"id":"RedHatAI/Qwen2-7B-Instruct-FP8","name":"Qwen2-7B-Instru
ct-FP8","created_by":"redhatai","source":"official","release_date":"2024-06-14","context_window":32768,"license":"apache-2.0","parameters":7.6,"page_url":"https://huggingface.co/RedHatAI/Qwen2-7B-Instruct-FP8","architecture":"transformer","model_type":"chat","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-04-14"},{"id":"ricdomolm/mini-coder-1.7b","name":"mini-coder-1.7b","created_by":"ricdomolm","source":"official","description":"`mini-coder-1.7b` is a 1.7B parameter model distilled from Qwen 3 Coder 30B A3B. It punches well above its weight, outperforming SWE-agent-LM 7B on [SWE-bench Verified Bash only](https://www.swebench.com/):","release_date":"2025-09-30","context_window":40960,"license":"mit","parameters":1.7,"page_url":"https://huggingface.co/ricdomolm/mini-coder-1.7b","architecture":"transformer","tagline":"`mini-coder-1.7b` is a 1.7B parameter model distilled from Qwen 3 Coder 30B A3B.","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"tools":["function_calling"],"last_updated":"2026-05-01"},{"id":"SakanaAI/TinySwallow-1.5B-Instruct","name":"TinySwallow-1.5B-Instruct","created_by":"sakanaai","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"parameters":1.5,"page_url":"https://huggingface.co/SakanaAI/TinySwallow-1.5B-Instruct","description":"🤗 [Models](https://huggingface.co/SakanaAI) | 📚 [Paper](https://arxiv.org/abs/2501.16937) | 📝 [Blog](https://sakana.ai/taid-jp/) | 🐦 [Twitter](https://twitter.com/SakanaAILabs)","release_date":"2025-01-07","context_window":32768,"license":"apache-2.0","tagline":"🤗 [Models](https://huggingface.co/SakanaAI) | 📚 [Paper](https://arxiv.org/abs/2501.16937) | 📝 [Blog](https://sakana.ai/taid-jp/) | 🐦 
[Twitter](https://twitter.com/SakanaAILabs)","architecture":"transformer","open_weight":true,"tools":["function_calling"]},{"id":"ShahriarFerdoush/llama-3.2-1b-code-instruct","name":"llama-3.2-1b-code-instruct","created_by":"shahriarferdoush","source":"official","family":"llama-3.2","description":"A lightweight yet powerful **code-focused language model** fine-tuned from **Meta Llama-3.2-1B** using **QLoRA (4-bit)** on the **CodeAlpaca-20K** dataset. Designed for **efficient code generation, reasoning, and problem-solving** on limited GPU resources.","release_date":"2025-12-24","context_window":131072,"license":"apache-2.0","parameters":1.2,"page_url":"https://huggingface.co/ShahriarFerdoush/llama-3.2-1b-code-instruct","architecture":"transformer","model_type":"chat","tagline":"A lightweight yet powerful **code-focused language model** fine-tuned from **Meta Llama-3.2-1B** using **QLoRA (4-bit)** on the **CodeAlpaca-20K** dataset.","capabilities":{"streaming":true,"fine_tuning":true},"open_weight":true,"modalities":{"input":["text"],"output":["text"]},"last_updated":"2026-05-07"},{"id":"speakleash/Bielik-7B-Instruct-v0.1","name":"Bielik-7B-Instruct-v0.1","created_by":"speakleash","source":"official","last_updated":"2026-03-21","capabilities":{"streaming":true},"parameters":7},{"id":"swap-uniba/LLaMAntino-3-ANITA-8B-Inst-DPO-ITA","name":"LLaMAntino-3-ANITA-8B-Inst-DPO-ITA","created_by":"swap-uniba","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"model_type":"chat","parameters":8,"page_url":"https://huggingface.co/swap-uniba/LLaMAntino-3-ANITA-8B-Inst-DPO-ITA","description":"📣 New MODEL FAMILY❗ [https://huggingface.co/m-polignano/ANITA-NEXT-24B-Magistral-2506-VISION-ITA](https://huggingface.co/m-polignano/ANITA-NEXT-24B-Magistral-2506-VISION-ITA)","release_date":"2024-04-29","context_window":8192,"license":"llama3","tagline":"📣 New MODEL FAMILY❗ 
[https://huggingface.co/m-polignano/ANITA-NEXT-24B-Magistral-2506-VISION-ITA](https://huggingface.co/m-polignano/ANITA-NEXT-24B-Magistral-2506-VISION-ITA)","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"swiss-ai/Apertus-70B-Instruct-2509","name":"Apertus-70B-Instruct-2509","created_by":"swiss-ai","source":"official","release_date":"2025-09-01","context_window":65536,"license":"apache-2.0","parameters":71,"alias":"swiss-ai/Apertus-70B-Instruct","page_url":"https://huggingface.co/swiss-ai/Apertus-70B-Instruct-2509","architecture":"transformer","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"tools":["function_calling"],"last_updated":"2026-06-10"},{"id":"swiss-ai/Apertus-70B-Instruct","name":"Apertus-70B-Instruct-2509","created_by":"swiss-ai","source":"official","release_date":"2025-09-01","context_window":65536,"license":"apache-2.0","parameters":71,"page_url":"https://huggingface.co/swiss-ai/Apertus-70B-Instruct-2509","architecture":"transformer","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"tools":["function_calling"],"snapshots":["swiss-ai/Apertus-70B-Instruct-2509"],"last_updated":"2026-06-10"},{"id":"swiss-ai/Apertus-8B-Instruct-2509","name":"Apertus-8B-Instruct-2509","created_by":"swiss-ai","source":"official","last_updated":"2026-04-21","alias":"swiss-ai/Apertus-8B-Instruct","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"parameters":8.1,"page_url":"https://huggingface.co/swiss-ai/Apertus-8B-Instruct-2509","release_date":"2025-08-13","context_window":65536,"license":"apache-2.0","architecture":"transformer","open_weight":true,"tools":["function_calling"]},{"id":"swiss-ai/Apertus-8B-Instruct","name":"Apertus-8B-Instruct-2509","created_by":"swiss-ai","source":"official","last_updated":"2026-04-21","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"sn
apshots":["swiss-ai/Apertus-8B-Instruct-2509"],"parameters":8.1,"page_url":"https://huggingface.co/swiss-ai/Apertus-8B-Instruct-2509","release_date":"2025-08-13","context_window":65536,"license":"apache-2.0","architecture":"transformer","open_weight":true,"tools":["function_calling"]},{"id":"TinyLlama/TinyLlama-1.1B-Chat-v1.0","name":"TinyLlama-1.1B-Chat-v1.0","created_by":"tinyllama","source":"official","release_date":"2023-12-30","context_window":2048,"license":"apache-2.0","parameters":1.1,"page_url":"https://huggingface.co/TinyLlama/TinyLlama-1.1B-Chat-v1.0","architecture":"transformer","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"tools":["function_calling"],"last_updated":"2026-05-01"},{"id":"tokyotech-llm/Llama-3-Swallow-8B-Instruct-v0.1","name":"Llama-3-Swallow-8B-Instruct-v0.1","created_by":"tokyotech-llm","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"family":"Llama-3","model_type":"chat","parameters":8,"page_url":"https://huggingface.co/tokyotech-llm/Llama-3-Swallow-8B-Instruct-v0.1","description":"Our Swallow model has undergone continual pre-training from the [Llama 3 family](https://huggingface.co/collections/meta-llama/meta-llama-3-66214712577ca38149ebb2b6), primarily with the addition of Japanese language data. The Instruct versions use supervised fine-tuning (SFT) and Chat Vector. 
Links to other models can be found in the index.","release_date":"2024-06-26","context_window":8192,"license":"llama3","tagline":"Our Swallow model has undergone continual pre-training from the [Llama 3 family](https://huggingface.co/collections/meta-llama/meta-llama-3-66214712577ca38149ebb2b6), primarily with the addition of Japanese language data.","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"tokyotech-llm/Llama-3.1-Swallow-8B-Instruct-v0.5","name":"Llama-3.1-Swallow-8B-Instruct-v0.5","created_by":"tokyotech-llm","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"family":"Llama-3.1","model_type":"chat","parameters":8,"page_url":"https://huggingface.co/tokyotech-llm/Llama-3.1-Swallow-8B-Instruct-v0.5","description":"Llama 3.1 Swallow is a series of large language models (8B, 70B) that were built by continual pre-training on the [Meta Llama 3.1](https://huggingface.co/collections/meta-llama/llama-31-669fc079a0c406a149a5738f) models. 
Llama 3.1 Swallow enhanced the Japanese language capabilities of the original Llama 3.1 while retaining the English language capabilities.","release_date":"2025-06-12","context_window":131072,"license":"llama3.3","tagline":"Llama 3.1 Swallow is a series of large language models (8B, 70B) that were built by continual pre-training on the [Meta Llama 3.1](https://huggingface.co/collections/meta-llama/llama-31-669fc079a0c406a149a5738f) models.","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"unsloth/gemma-2-9b-it","name":"gemma-2-9b-it","created_by":"unsloth","source":"official","last_updated":"2026-03-27","family":"gemma-2","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"model_type":"chat","parameters":9.2,"page_url":"https://huggingface.co/unsloth/gemma-2-9b-it","release_date":"2024-07-03","context_window":8192,"license":"gemma","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"unsloth/gemma-3-1b-it","name":"gemma-3-1b-it","created_by":"unsloth","source":"official","family":"gemma-3","description":"- Fine-tune Gemma 3 (12B) for free using our Google [Colab notebook here](https://docs.unsloth.ai/get-started/unsloth-notebooks)! - Read our Blog about Gemma 3 support: [unsloth.ai/blog/gemma3](https://unsloth.ai/blog/gemma3) - View the rest of our notebooks in our [docs here](https://docs.unsloth.ai/get-started/unsloth-notebooks). - Export your fine-tuned model to GGUF, Ollama, llama.cpp or 🤗HF.","release_date":"2025-03-12","context_window":32768,"license":"gemma","parameters":1,"page_url":"https://huggingface.co/unsloth/gemma-3-1b-it","architecture":"transformer","model_type":"chat","tagline":"- Fine-tune Gemma 3 (12B) for free using our Google [Colab notebook here](https://docs.unsloth.ai/get-started/unsloth-notebooks)! 
- Read our Blog about Gemma 3 support: [unsloth.ai/blog/gemma3](https://unsloth.ai/blog/gemma3) - View the rest of our notebooks in our [docs here](https://docs.unsloth.ai/get-started/unsloth-notebooks).","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-05-01"},{"id":"unsloth/llama-3-8b-Instruct","name":"llama-3-8b-Instruct","created_by":"unsloth","source":"official","last_updated":"2026-03-24","family":"llama-3","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"model_type":"chat","parameters":8,"page_url":"https://huggingface.co/unsloth/llama-3-8b-Instruct","description":"Directly quantized 4bit model with `bitsandbytes`.","release_date":"2024-04-18","context_window":8192,"license":"llama3","tagline":"Directly quantized 4bit model with `bitsandbytes`.","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"unsloth/Llama-3.1-8B-Instruct","name":"Llama-3.1-8B-Instruct","created_by":"unsloth","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"family":"Llama-3.1","model_type":"chat","parameters":8,"page_url":"https://huggingface.co/unsloth/Llama-3.1-8B-Instruct","release_date":"2025-02-15","context_window":131072,"license":"llama3.1","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"unsloth/Llama-3.2-1B-Instruct","name":"Llama-3.2-1B-Instruct","created_by":"unsloth","source":"official","family":"Llama-3.2","release_date":"2024-09-25","context_window":131072,"license":"llama3.2","parameters":1.2,"page_url":"https://huggingface.co/unsloth/Llama-3.2-1B-Instruct","architecture":"transformer","model_type":"chat","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_
weight":true,"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-05-01"},{"id":"unsloth/Llama-3.2-3B-Instruct","name":"Llama-3.2-3B-Instruct","created_by":"unsloth","source":"official","family":"Llama-3.2","release_date":"2024-09-25","context_window":131072,"license":"llama3.2","parameters":3.2,"page_url":"https://huggingface.co/unsloth/Llama-3.2-3B-Instruct","architecture":"transformer","model_type":"chat","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-05-01"},{"id":"unsloth/Llama-3.3-70B-Instruct","name":"Llama-3.3-70B-Instruct","created_by":"unsloth","source":"official","family":"Llama-3.3","release_date":"2024-12-06","context_window":131072,"license":"llama3.3","parameters":71,"page_url":"https://huggingface.co/unsloth/Llama-3.3-70B-Instruct","architecture":"transformer","model_type":"chat","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-05-06"},{"id":"unsloth/Meta-Llama-3.1-8B-Instruct","name":"Meta-Llama-3.1-8B-Instruct","created_by":"unsloth","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"family":"Llama-3.1","model_type":"chat","parameters":8,"page_url":"https://huggingface.co/unsloth/Meta-Llama-3.1-8B-Instruct","description":"We have a free Google Colab Tesla T4 notebook for Llama 3.1 (8B) here: https://colab.research.google.com/drive/1Ys44kVvmeZtnICzWz0xgpRnrIOjZAuxp?usp=sharing","release_date":"2024-07-23","context_window":131072,"license":"llama3.1","tagline":"We have a free Google Colab Tesla T4 notebook for Llama 3.1 (8B) here: 
https://colab.research.google.com/drive/1Ys44kVvmeZtnICzWz0xgpRnrIOjZAuxp?usp=sharing","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"unsloth/Mistral-Small-24B-Instruct-2501","name":"Mistral-Small-24B-Instruct-2501","created_by":"unsloth","source":"official","last_updated":"2026-03-24","alias":"unsloth/Mistral-Small-24B-Instruct","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"model_type":"chat","parameters":24,"page_url":"https://huggingface.co/unsloth/Mistral-Small-24B-Instruct-2501","description":"We have a free Google Colab Tesla T4 notebook for Mistral (7B) here: https://colab.research.google.com/github/unslothai/notebooks/blob/main/nb/Mistral_v0.3_(7B)-Conversational.ipynb","release_date":"2025-01-30","context_window":32768,"license":"apache-2.0","tagline":"We have a free Google Colab Tesla T4 notebook for Mistral (7B) here: https://colab.research.google.com/github/unslothai/notebooks/blob/main/nb/Mistral_v0.3_(7B)-Conversational.ipynb","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"unsloth/Mistral-Small-24B-Instruct","name":"Mistral-Small-24B-Instruct-2501","created_by":"unsloth","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"snapshots":["unsloth/Mistral-Small-24B-Instruct-2501"],"model_type":"chat","parameters":24,"page_url":"https://huggingface.co/unsloth/Mistral-Small-24B-Instruct-2501","description":"We have a free Google Colab Tesla T4 notebook for Mistral (7B) here: https://colab.research.google.com/github/unslothai/notebooks/blob/main/nb/Mistral_v0.3_(7B)-Conversational.ipynb","release_date":"2025-01-30","context_window":32768,"license":"apache-2.0","tagline":"We have a free Google Colab Tesla T4 notebook for Mistral (7B) here: 
https://colab.research.google.com/github/unslothai/notebooks/blob/main/nb/Mistral_v0.3_(7B)-Conversational.ipynb","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"unsloth/Qwen2.5-0.5B-Instruct","name":"Qwen2.5-0.5B-Instruct","created_by":"unsloth","source":"official","description":"We have a Qwen 2.5 (all model sizes) [free Google Colab Tesla T4 notebook](https://colab.research.google.com/drive/1Kose-ucXO1IBaZq5BvbwWieuubP7hxvQ?usp=sharing). Also a [Qwen 2.5 conversational style notebook](https://colab.research.google.com/drive/1qN1CEalC70EO1wGKhNxs1go1W9So61R5?usp=sharing).","release_date":"2024-09-18","context_window":32768,"license":"apache-2.0","parameters":0.49,"page_url":"https://huggingface.co/unsloth/Qwen2.5-0.5B-Instruct","architecture":"transformer","model_type":"chat","tagline":"We have a Qwen 2.5 (all model sizes) [free Google Colab Tesla T4 notebook](https://colab.research.google.com/drive/1Kose-ucXO1IBaZq5BvbwWieuubP7hxvQ?usp=sharing).","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-05-01"},{"id":"unsloth/Qwen2.5-1.5B-Instruct","name":"Qwen2.5-1.5B-Instruct","created_by":"unsloth","source":"official","description":"We have a Qwen 2.5 (all model sizes) [free Google Colab Tesla T4 notebook](https://colab.research.google.com/drive/1Kose-ucXO1IBaZq5BvbwWieuubP7hxvQ?usp=sharing). 
Also a [Qwen 2.5 conversational style notebook](https://colab.research.google.com/drive/1qN1CEalC70EO1wGKhNxs1go1W9So61R5?usp=sharing).","release_date":"2024-09-18","context_window":32768,"license":"apache-2.0","parameters":1.5,"page_url":"https://huggingface.co/unsloth/Qwen2.5-1.5B-Instruct","architecture":"transformer","model_type":"chat","tagline":"We have a Qwen 2.5 (all model sizes) [free Google Colab Tesla T4 notebook](https://colab.research.google.com/drive/1Kose-ucXO1IBaZq5BvbwWieuubP7hxvQ?usp=sharing).","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-05-01"},{"id":"unsloth/Qwen2.5-14B-Instruct","name":"Qwen2.5-14B-Instruct","created_by":"unsloth","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"model_type":"chat","parameters":15,"page_url":"https://huggingface.co/unsloth/Qwen2.5-14B-Instruct","description":"We have a Qwen 2.5 (all model sizes) [free Google Colab Tesla T4 notebook](https://colab.research.google.com/drive/1Kose-ucXO1IBaZq5BvbwWieuubP7hxvQ?usp=sharing). 
Also a [Qwen 2.5 conversational style notebook](https://colab.research.google.com/drive/1qN1CEalC70EO1wGKhNxs1go1W9So61R5?usp=sharing).","release_date":"2024-09-23","context_window":32768,"license":"apache-2.0","tagline":"We have a Qwen 2.5 (all model sizes) [free Google Colab Tesla T4 notebook](https://colab.research.google.com/drive/1Kose-ucXO1IBaZq5BvbwWieuubP7hxvQ?usp=sharing).","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"unsloth/Qwen2.5-32B-Instruct","name":"Qwen2.5-32B-Instruct","created_by":"unsloth","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"model_type":"chat","parameters":33,"page_url":"https://huggingface.co/unsloth/Qwen2.5-32B-Instruct","description":"We have a Qwen 2.5 (all model sizes) [free Google Colab Tesla T4 notebook](https://colab.research.google.com/drive/1Kose-ucXO1IBaZq5BvbwWieuubP7hxvQ?usp=sharing). Also a [Qwen 2.5 conversational style notebook](https://colab.research.google.com/drive/1qN1CEalC70EO1wGKhNxs1go1W9So61R5?usp=sharing).","release_date":"2024-09-23","context_window":32768,"license":"apache-2.0","tagline":"We have a Qwen 2.5 (all model sizes) [free Google Colab Tesla T4 notebook](https://colab.research.google.com/drive/1Kose-ucXO1IBaZq5BvbwWieuubP7hxvQ?usp=sharing).","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"unsloth/Qwen2.5-3B-Instruct","name":"Qwen2.5-3B-Instruct","created_by":"unsloth","source":"official","description":"We have a Qwen 2.5 (all model sizes) [free Google Colab Tesla T4 notebook](https://colab.research.google.com/drive/1Kose-ucXO1IBaZq5BvbwWieuubP7hxvQ?usp=sharing). 
Also a [Qwen 2.5 conversational style notebook](https://colab.research.google.com/drive/1qN1CEalC70EO1wGKhNxs1go1W9So61R5?usp=sharing).","release_date":"2024-09-18","context_window":32768,"license":"other","parameters":3.1,"page_url":"https://huggingface.co/unsloth/Qwen2.5-3B-Instruct","architecture":"transformer","model_type":"chat","tagline":"We have a Qwen 2.5 (all model sizes) [free Google Colab Tesla T4 notebook](https://colab.research.google.com/drive/1Kose-ucXO1IBaZq5BvbwWieuubP7hxvQ?usp=sharing).","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-05-01"},{"id":"unsloth/Qwen2.5-7B-Instruct","name":"Qwen2.5-7B-Instruct","created_by":"unsloth","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"model_type":"chat","parameters":7.6,"page_url":"https://huggingface.co/unsloth/Qwen2.5-7B-Instruct","description":"We have a Qwen 2.5 (all model sizes) [free Google Colab Tesla T4 notebook](https://colab.research.google.com/drive/1Kose-ucXO1IBaZq5BvbwWieuubP7hxvQ?usp=sharing). 
Also a [Qwen 2.5 conversational style notebook](https://colab.research.google.com/drive/1qN1CEalC70EO1wGKhNxs1go1W9So61R5?usp=sharing).","release_date":"2024-09-18","context_window":32768,"license":"apache-2.0","tagline":"We have a Qwen 2.5 (all model sizes) [free Google Colab Tesla T4 notebook](https://colab.research.google.com/drive/1Kose-ucXO1IBaZq5BvbwWieuubP7hxvQ?usp=sharing).","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"unsloth/Qwen2.5-Coder-32B-Instruct","name":"Qwen2.5-Coder-32B-Instruct","created_by":"unsloth","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"model_type":"code","parameters":33,"page_url":"https://huggingface.co/unsloth/Qwen2.5-Coder-32B-Instruct","description":"We have a Qwen 2.5 (all model sizes) [free Google Colab Tesla T4 notebook](https://colab.research.google.com/drive/1Kose-ucXO1IBaZq5BvbwWieuubP7hxvQ?usp=sharing). Also a [Qwen 2.5 conversational style notebook](https://colab.research.google.com/drive/1qN1CEalC70EO1wGKhNxs1go1W9So61R5?usp=sharing).","release_date":"2024-11-12","context_window":32768,"license":"apache-2.0","tagline":"We have a Qwen 2.5 (all model sizes) [free Google Colab Tesla T4 notebook](https://colab.research.google.com/drive/1Kose-ucXO1IBaZq5BvbwWieuubP7hxvQ?usp=sharing).","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"unsloth/Qwen2.5-Coder-7B-Instruct","name":"Qwen2.5-Coder-7B-Instruct","created_by":"unsloth","source":"official","description":"We have a Qwen 2.5 (all model sizes) [free Google Colab Tesla T4 notebook](https://colab.research.google.com/drive/1Kose-ucXO1IBaZq5BvbwWieuubP7hxvQ?usp=sharing). 
Also a [Qwen 2.5 conversational style notebook](https://colab.research.google.com/drive/1qN1CEalC70EO1wGKhNxs1go1W9So61R5?usp=sharing).","release_date":"2024-09-23","context_window":32768,"license":"apache-2.0","parameters":7.6,"page_url":"https://huggingface.co/unsloth/Qwen2.5-Coder-7B-Instruct","architecture":"transformer","model_type":"code","tagline":"We have a Qwen 2.5 (all model sizes) [free Google Colab Tesla T4 notebook](https://colab.research.google.com/drive/1Kose-ucXO1IBaZq5BvbwWieuubP7hxvQ?usp=sharing).","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-04-16"},{"id":"unsloth/Qwen3-1.7B-Base","name":"Qwen3-1.7B-Base","created_by":"unsloth","source":"official","release_date":"2025-04-28","context_window":32768,"license":"apache-2.0","page_url":"https://huggingface.co/unsloth/Qwen3-1.7B-Base","architecture":"transformer","model_type":"chat","capabilities":{"streaming":true,"fine_tuning":true},"open_weight":true,"modalities":{"input":["text"],"output":["text"]},"last_updated":"2026-05-17"},{"id":"unsloth/Qwen3-4B-Base","name":"Qwen3-4B-Base","created_by":"unsloth","source":"official","release_date":"2025-04-28","context_window":32768,"license":"apache-2.0","page_url":"https://huggingface.co/unsloth/Qwen3-4B-Base","architecture":"transformer","model_type":"chat","capabilities":{"streaming":true,"fine_tuning":true},"open_weight":true,"modalities":{"input":["text"],"output":["text"]},"last_updated":"2026-06-02"},{"id":"unsloth/Qwen3-4B-Instruct-2507","name":"Qwen3-4B-Instruct-2507","created_by":"unsloth","source":"official","release_date":"2025-08-06","context_window":262144,"model_type":"chat","license":"apache-2.0","alias":"unsloth/Qwen3-4B-Instruct","page_url":"https://huggingface.co/unsloth/Qwen3-4B-Instruct-2507","architecture":"transformer","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"modalit
ies":{"input":["text"],"output":["text"]},"open_weight":true,"tools":["function_calling"],"last_updated":"2026-05-01"},{"id":"unsloth/Qwen3-4B-Instruct","name":"Qwen3-4B-Instruct-2507","created_by":"unsloth","source":"official","release_date":"2025-08-06","context_window":262144,"license":"apache-2.0","page_url":"https://huggingface.co/unsloth/Qwen3-4B-Instruct-2507","architecture":"transformer","model_type":"chat","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"snapshots":["unsloth/Qwen3-4B-Instruct-2507"],"last_updated":"2026-05-01"},{"id":"unsloth/Qwen3-8B-Base","name":"Qwen3-8B-Base","created_by":"unsloth","source":"official","release_date":"2025-04-28","context_window":32768,"license":"apache-2.0","page_url":"https://huggingface.co/unsloth/Qwen3-8B-Base","architecture":"transformer","model_type":"chat","capabilities":{"streaming":true,"fine_tuning":true},"open_weight":true,"modalities":{"input":["text"],"output":["text"]},"last_updated":"2026-03-26"},{"id":"unsloth/Qwen3-8B","name":"Qwen3-8B","created_by":"unsloth","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"model_type":"chat","parameters":8,"page_url":"https://huggingface.co/unsloth/Qwen3-8B","release_date":"2025-04-28","context_window":40960,"license":"apache-2.0","architecture":"transformer","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"unsloth/tinyllama-chat","name":"tinyllama-chat","created_by":"unsloth","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"page_url":"https://huggingface.co/unsloth/tinyllama-chat","description":"[](https://discord.gg/u54VK8m8tk) [](https://ko-fi.com/unsloth) 
[](https://github.com/unslothai/unsloth)","release_date":"2024-02-14","context_window":2048,"license":"apache-2.0","parameters":1.1,"tagline":"[](https://discord.gg/u54VK8m8tk) [Discord community.","release_date":"2025-07-20","context_window":131072,"license":"mit","tagline":"👋 Join our Discord community.","architecture":"moe","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"zai-org/GLM-4.5-Air","name":"GLM-4.5-Air","created_by":"zhipu","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"family":"GLM-4.5","model_type":"chat","page_url":"https://huggingface.co/zai-org/GLM-4.5-Air","description":"👋 Join our Discord community.","release_date":"2025-07-20","context_window":131072,"license":"mit","parameters":110,"tagline":"👋 Join our Discord community.","architecture":"moe","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"zai-org/GLM-4.5","name":"GLM-4.5","created_by":"zhipu","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"family":"GLM-4.5","model_type":"chat","page_url":"https://huggingface.co/zai-org/GLM-4.5","description":"👋 Join our Discord community.","release_date":"2025-07-20","context_window":131072,"license":"mit","parameters":358,"tagline":"👋 Join our Discord community.","architecture":"moe","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"zai-org/GLM-4.6-FP8","name":"GLM-4.6-FP8","created_by":"zhipu","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"family":"GLM-4.6","model_type":"chat","page_url":"https://huggingface.co/zai-org/GLM-4.6-FP8","description":"👋 Join our Discord community.","release_date":"2025-09-29","context_window":202752,"license":"mit","tagline":"👋 Join our Discord 
community.","architecture":"moe","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"zai-org/GLM-4.6","name":"GLM-4.6","created_by":"zhipu","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"family":"GLM-4.6","model_type":"chat","page_url":"https://huggingface.co/zai-org/GLM-4.6","description":"👋 Join our Discord community.","release_date":"2025-09-29","context_window":202752,"license":"mit","parameters":357,"tagline":"👋 Join our Discord community.","architecture":"moe","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"zai-org/GLM-4.7-Flash","name":"GLM-4.7-Flash","created_by":"zhipu","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"family":"GLM-4.7","model_type":"chat","page_url":"https://huggingface.co/zai-org/GLM-4.7-Flash","description":"👋 Join our Discord community.","release_date":"2026-01-19","context_window":202752,"license":"mit","parameters":31,"tagline":"👋 Join our Discord community.","architecture":"moe","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"zai-org/GLM-4.7-FP8","name":"GLM-4.7-FP8","created_by":"zhipu","source":"official","last_updated":"2026-05-29","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"family":"GLM-4.7","model_type":"chat","page_url":"https://huggingface.co/zai-org/GLM-4.7-FP8","description":"👋 Join our Discord community.","release_date":"2025-12-22","context_window":202752,"license":"mit","tagline":"👋 Join our Discord 
community.","architecture":"moe","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]},"parameters":358},{"id":"zai-org/GLM-4.7","name":"GLM-4.7","created_by":"zhipu","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"family":"GLM-4.7","model_type":"chat","page_url":"https://huggingface.co/zai-org/GLM-4.7","description":"👋 Join our Discord community.","release_date":"2025-12-22","context_window":202752,"license":"mit","parameters":358,"tagline":"👋 Join our Discord community.","architecture":"moe","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"zai-org/GLM-5.1-FP8","name":"GLM-5.1-FP8","created_by":"zhipu","source":"official","family":"GLM-5.1","release_date":"2026-04-03","context_window":202752,"license":"mit","parameters":754,"page_url":"https://huggingface.co/zai-org/GLM-5.1-FP8","architecture":"moe","model_type":"chat","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-04-10"},{"id":"zai-org/GLM-5.1","name":"GLM-5.1","created_by":"zhipu","source":"official","family":"GLM-5.1","release_date":"2026-04-03","context_window":202752,"license":"mit","parameters":754,"page_url":"https://huggingface.co/zai-org/GLM-5.1","architecture":"moe","model_type":"chat","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-04-12"},{"id":"zai-org/GLM-5.2-FP8","name":"GLM-5.2-FP8","created_by":"zhipu","source":"official","family":"GLM-5.2","release_date":"2026-06-16","context_window":1048576,"license":"mit","parameters":753,"page_url":"https://huggingface.co/zai-org/GLM-5.2-FP8","architecture":"moe","model_type":"chat","capabilities":{"streaming":tru
e,"tool_call":true,"fine_tuning":true},"open_weight":true,"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-06-20"},{"id":"zai-org/GLM-5.2","name":"GLM-5.2","created_by":"zhipu","source":"official","family":"GLM-5.2","release_date":"2026-06-16","context_window":1048576,"license":"mit","parameters":753,"page_url":"https://huggingface.co/zai-org/GLM-5.2","architecture":"moe","model_type":"chat","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"open_weight":true,"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-06-29"},{"id":"zai-org/GLM-5","name":"GLM-5","created_by":"zhipu","source":"official","last_updated":"2026-03-24","capabilities":{"streaming":true,"tool_call":true,"fine_tuning":true},"family":"GLM-5","model_type":"chat","page_url":"https://huggingface.co/zai-org/GLM-5","description":"👋 Join our WeChat or Discord community.","release_date":"2026-02-11","context_window":202752,"license":"mit","parameters":754,"tagline":"👋 Join our WeChat or Discord","architecture":"moe","open_weight":true,"tools":["function_calling"],"modalities":{"input":["text"],"output":["text"]}},{"id":"zai-org/GLM-Z1-32B-0414","name":"GLM-Z1-32B-0414","created_by":"zhipu","source":"official","last_updated":"2026-03-21","capabilities":{"streaming":true},"model_type":"chat","family":"glm","parameters":32}]}; export const models: Model[] = provider.models.map((m) => ({ ...m, provider: provider.id })); diff --git a/packages/npm/src/providers/openrouter.ts b/packages/npm/src/providers/openrouter.ts index ed37ed98d..385623786 100644 --- a/packages/npm/src/providers/openrouter.ts +++ b/packages/npm/src/providers/openrouter.ts @@ -3,6 +3,6 @@ import type { ProviderWithModels, Model } from '../types'; -export const provider: ProviderWithModels = {"id":"openrouter","name":"OpenRouter","region":"US","headquarters":"New York, 
NY","founded":2023,"url":"https://openrouter.ai","api_url":"https://openrouter.ai/api/v1","docs_url":"https://openrouter.ai/docs","pricing_url":"https://openrouter.ai/models","description":"Unified API gateway providing access to 200+ models from multiple providers with standardized pricing.","type":"aggregator","playground_url":"https://openrouter.ai/playground","status_url":"https://status.openrouter.ai","openai_compatible":true,"free_tier":true,"github_url":"https://github.com/OpenRouterTeam","models_url":"https://openrouter.ai/models","twitter_url":"https://x.com/OpenRouterAI","discord_url":"https://discord.com/invite/openrouter","terms_url":"https://openrouter.ai/terms","support_url":"https://openrouter.ai/support","icon":"\n \n","models":[{"id":"~anthropic/claude-fable-latest","name":"Anthropic: Claude Fable Latest","created_by":"~anthropic","source":"official","family":"claude-fable","description":"This model always redirects to the latest model in the Claude Fable family.","release_date":"2026-06-09","context_window":1000000,"max_output_tokens":128000,"model_type":"chat","tagline":"This model always redirects to the latest model in the Claude Fable family.","capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":10,"output":50,"cached_input":1},"tools":["function_calling"],"last_updated":"2026-06-18"},{"id":"~anthropic/claude-haiku-latest","name":"Anthropic Claude Haiku Latest","created_by":"~anthropic","source":"official","family":"claude-haiku","description":"This model always redirects to the latest model in the Anthropic Claude Haiku family.","release_date":"2026-04-27","context_window":200000,"max_output_tokens":64000,"model_type":"chat","tagline":"This model always redirects to the latest model in the Anthropic Claude Haiku 
family.","capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":1,"output":5,"cached_input":0.1},"tools":["function_calling"],"last_updated":"2026-05-14"},{"id":"~anthropic/claude-opus-latest","name":"Anthropic: Claude Opus Latest","created_by":"~anthropic","source":"official","family":"claude-opus","description":"This model always redirects to the latest model in the Claude Opus family.","release_date":"2026-04-21","context_window":1000000,"max_output_tokens":128000,"model_type":"chat","tagline":"This model always redirects to the latest model in the Claude Opus family.","capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":5,"output":25,"cached_input":0.5},"tools":["function_calling"],"last_updated":"2026-04-22"},{"id":"~anthropic/claude-sonnet-latest","name":"Anthropic Claude Sonnet Latest","created_by":"~anthropic","source":"official","family":"claude-sonnet","description":"This model always redirects to the latest model in the Anthropic Claude Sonnet family.","release_date":"2026-04-27","context_window":1000000,"max_output_tokens":128000,"model_type":"chat","tagline":"This model always redirects to the latest model in the Anthropic Claude Sonnet family.","capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":3,"output":15,"cached_input":0.3},"tools":["function_calling"],"last_updated":"2026-05-01"},{"id":"~google/gemini-flash-latest","name":"Google Gemini Flash Latest","created_by":"~google","source":"official","description":"This model always redirects to the latest model in the Google Gemini Flash family.","release_date":"2026-04-27","context_window":1048576,"max_output_tokens":65536,"model_type":"chat","tagline":"This 
model always redirects to the latest model in the Google Gemini Flash family.","capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"modalities":{"input":["text","image","video","audio"],"output":["text"]},"pricing":{"input":1.5,"output":9,"cached_input":0.15},"tools":["function_calling"],"last_updated":"2026-05-23"},{"id":"~google/gemini-pro-latest","name":"Google Gemini Pro Latest","created_by":"~google","source":"official","description":"This model always redirects to the latest model in the Google Gemini Pro family.","release_date":"2026-04-27","context_window":1048576,"max_output_tokens":65536,"model_type":"chat","tagline":"This model always redirects to the latest model in the Google Gemini Pro family.","capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"modalities":{"input":["audio","image","text","video"],"output":["text"]},"pricing":{"input":2,"output":12,"cached_input":0.2},"tools":["function_calling"],"last_updated":"2026-05-01"},{"id":"~moonshotai/kimi-latest","name":"MoonshotAI Kimi Latest","created_by":"~moonshotai","source":"official","family":"kimi","description":"This model always redirects to the latest model in the MoonshotAI Kimi family.","release_date":"2026-04-27","context_window":262144,"max_output_tokens":262144,"model_type":"chat","tagline":"This model always redirects to the latest model in the MoonshotAI Kimi family.","capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":0.55,"output":3.2,"cached_input":0.11},"tools":["function_calling"],"last_updated":"2026-06-29"},{"id":"~openai/gpt-latest","name":"OpenAI GPT Latest","created_by":"~openai","source":"official","description":"This model always redirects to the latest model in the OpenAI GPT family.","release_date":"2026-04-27","context_window":1050000,"max_output_tokens":128000,"tagline":"This 
model always redirects to the latest model in the OpenAI GPT family.","capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"modalities":{"input":["image","text"],"output":["text"]},"pricing":{"input":5,"output":30,"cached_input":0.5},"tools":["function_calling"],"last_updated":"2026-05-01"},{"id":"~openai/gpt-mini-latest","name":"OpenAI GPT Mini Latest","created_by":"~openai","source":"official","description":"This model always redirects to the latest model in the OpenAI GPT Mini family.","release_date":"2026-04-27","context_window":400000,"max_output_tokens":128000,"tagline":"This model always redirects to the latest model in the OpenAI GPT Mini family.","capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"modalities":{"input":["image","text"],"output":["text"]},"pricing":{"input":0.75,"output":4.5,"cached_input":0.075},"tools":["function_calling"],"last_updated":"2026-05-01"},{"id":"ai21/jamba-large-1.7","name":"AI21: Jamba Large 1.7","created_by":"ai21","source":"official","last_updated":"2026-03-24","description":"Jamba Large 1.7 is the latest model in the Jamba open family, offering improvements in grounding, instruction-following, and overall efficiency.","context_window":256000,"max_output_tokens":4096,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true},"pricing":{"input":2,"output":8},"model_type":"chat","release_date":"2025-08-08","tagline":"Jamba Large 1.7 is the latest model in the Jamba open family, offering improvements in grounding, instruction-following, and overall efficiency.","tools":["function_calling"]},{"id":"aion-labs/aion-1.0-mini","name":"AionLabs: Aion-1.0-Mini","created_by":"aion-labs","source":"official","last_updated":"2026-03-23","description":"Aion-1.0-Mini 32B parameter model is a distilled version of the DeepSeek-R1 model, designed for strong performance in reasoning domains such 
as mathematics, coding, and logic.","context_window":131072,"max_output_tokens":32768,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"reasoning":true},"pricing":{"input":0.7,"output":1.4},"release_date":"2025-02-04","tagline":"Aion-1.0-Mini 32B parameter model is a distilled version of the DeepSeek-R1 model, designed for strong performance in reasoning domains such as mathematics, coding, and logic."},{"id":"aion-labs/aion-1.0","name":"AionLabs: Aion-1.0","created_by":"aion-labs","source":"official","last_updated":"2026-03-23","description":"Aion-1.0 is a multi-model system designed for high performance across various tasks, including reasoning and coding.","context_window":131072,"max_output_tokens":32768,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"reasoning":true},"pricing":{"input":4,"output":8},"release_date":"2025-02-04","tagline":"Aion-1.0 is a multi-model system designed for high performance across various tasks, including reasoning and coding."},{"id":"aion-labs/aion-2.0","name":"AionLabs: Aion-2.0","created_by":"aion-labs","source":"official","last_updated":"2026-03-23","description":"Aion-2.0 is a variant of DeepSeek V3.2 optimized for immersive roleplaying and storytelling.","context_window":131072,"max_output_tokens":32768,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"reasoning":true},"pricing":{"input":0.8,"output":1.6,"cached_input":0.2},"release_date":"2026-02-23","tagline":"Aion-2.0 is a variant of DeepSeek V3.2 optimized for immersive roleplaying and storytelling."},{"id":"aion-labs/aion-rp-llama-3.1-8b","name":"AionLabs: Aion-RP 1.0 (8B)","created_by":"aion-labs","source":"official","last_updated":"2026-03-23","description":"Aion-RP-Llama-3.1-8B ranks the highest in the character evaluation portion of the RPBench-Auto benchmark, a roleplaying-specific variant of Arena-Hard-Auto, where LLMs evaluate each other’s 
responses.","context_window":32768,"max_output_tokens":32768,"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.8,"output":1.6},"parameters":8,"release_date":"2025-02-04","tagline":"Aion-RP-Llama-3.1-8B ranks the highest in the character evaluation portion of the RPBench-Auto benchmark, a roleplaying-specific variant of Arena-Hard-Auto, where LLMs evaluate each other’s responses."},{"id":"alfredpros/codellama-7b-instruct-solidity","name":"AlfredPros: CodeLLaMa 7B Instruct Solidity","created_by":"alfredpros","source":"official","last_updated":"2026-03-23","description":"A finetuned 7 billion parameters Code LLaMA - Instruct model to generate Solidity smart contract using 4-bit QLoRA finetuning provided by PEFT library.","context_window":4096,"max_output_tokens":4096,"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.8,"output":1.2},"family":"codellama","model_type":"code","parameters":7,"release_date":"2025-04-14","tagline":"A finetuned 7 billion parameters Code LLaMA - Instruct model to generate Solidity smart contract using 4-bit QLoRA finetuning provided by PEFT library."},{"id":"alibaba/tongyi-deepresearch-30b-a3b","name":"Tongyi DeepResearch 30B A3B","created_by":"alibaba","source":"official","last_updated":"2026-03-24","description":"Tongyi DeepResearch is an agentic large language model developed by Tongyi Lab, with 30 billion total parameters activating only 3 billion per token.","context_window":131072,"max_output_tokens":131072,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":0.09,"output":0.45,"cached_input":0.09},"model_type":"chat","parameters":30,"active_parameters":3,"release_date":"2025-09-18","tagline":"Tongyi DeepResearch is an agentic large language model developed by Tongyi Lab, with 30 billion total parameters activating only 3 billion per 
token.","tools":["function_calling"]},{"id":"allenai/molmo-2-8b","name":"AllenAI: Molmo2 8B","created_by":"allenai","source":"official","last_updated":"2026-03-21","description":"Molmo2-8B is an open vision-language model developed by the Allen Institute for AI (Ai2) as part of the Molmo2 family, supporting image, video, and multi-image understanding and grounding.","status":"deprecated","deprecation_date":"2026-03-23","context_window":36864,"max_output_tokens":36864,"modalities":{"input":["text","image","video"],"output":["text"]},"pricing":{"input":0.2,"output":0.2},"parameters":8},{"id":"allenai/olmo-2-0325-32b-instruct","name":"AllenAI: Olmo 2 32B Instruct","created_by":"allenai","source":"official","last_updated":"2026-03-23","description":"OLMo-2 32B Instruct is a supervised instruction-finetuned variant of the OLMo-2 32B March 2025 base model.","context_window":128000,"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.05,"output":0.2},"parameters":32,"release_date":"2025-03-14","tagline":"OLMo-2 32B Instruct is a supervised instruction-finetuned variant of the OLMo-2 32B March 2025 base model."},{"id":"allenai/olmo-3-32b-think","name":"AllenAI: Olmo 3 32B Think","created_by":"allenai","source":"official","last_updated":"2026-03-24","description":"Olmo 3 32B Think is a large-scale, 32-billion-parameter model purpose-built for deep reasoning, complex logic chains and advanced instruction-following scenarios.","context_window":65536,"max_output_tokens":65536,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":0.15,"output":0.5},"parameters":32,"release_date":"2025-11-21","tagline":"Olmo 3 32B Think is a large-scale, 32-billion-parameter model purpose-built for deep reasoning, complex logic chains and advanced instruction-following scenarios."},{"id":"allenai/olmo-3-7b-instruct","name":"AllenAI: Olmo 3 7B 
Instruct","created_by":"allenai","source":"official","last_updated":"2026-03-21","description":"Olmo 3 7B Instruct is a supervised instruction-fine-tuned variant of the Olmo 3 7B base model, optimized for instruction-following, question-answering, and natural conversational dialogue.","status":"deprecated","deprecation_date":"2026-03-23","context_window":65536,"max_output_tokens":65536,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"structured_output":true,"json_mode":true},"pricing":{"input":0.1,"output":0.2},"parameters":7},{"id":"allenai/olmo-3-7b-think","name":"AllenAI: Olmo 3 7B Think","created_by":"allenai","source":"official","last_updated":"2026-03-21","description":"Olmo 3 7B Think is a research-oriented language model in the Olmo family designed for advanced reasoning and instruction-driven tasks.","status":"deprecated","deprecation_date":"2026-03-23","context_window":65536,"max_output_tokens":65536,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":0.12,"output":0.2},"parameters":7},{"id":"allenai/olmo-3.1-32b-instruct","name":"AllenAI: Olmo 3.1 32B Instruct","created_by":"allenai","source":"official","last_updated":"2026-05-01","description":"Olmo 3.1 32B Instruct is a large-scale, 32-billion-parameter instruction-tuned language model engineered for high-performance conversational AI, multi-turn dialogue, and practical instruction following.","context_window":65536,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true},"pricing":{"input":0.2,"output":0.6},"parameters":32,"release_date":"2026-01-06","tagline":"Olmo 3.1 32B Instruct is a large-scale, 32-billion-parameter instruction-tuned language model engineered for high-performance conversational AI, multi-turn dialogue, and practical instruction 
followin","tools":["function_calling"],"max_output_tokens":16384,"status":"deprecated","deprecation_date":"2026-05-07"},{"id":"allenai/olmo-3.1-32b-think","name":"AllenAI: Olmo 3.1 32B Think","created_by":"allenai","source":"official","last_updated":"2026-03-24","description":"Olmo 3.1 32B Think is a large-scale, 32-billion-parameter model designed for deep reasoning, complex multi-step logic, and advanced instruction following.","context_window":65536,"max_output_tokens":65536,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":0.15,"output":0.5},"parameters":32,"status":"deprecated","release_date":"2025-12-16","deprecation_date":"2026-04-06","tagline":"Olmo 3.1 32B Think is a large-scale, 32-billion-parameter model designed for deep reasoning, complex multi-step logic, and advanced instruction following."},{"id":"alpindale/goliath-120b","name":"Goliath 120B","created_by":"alpindale","source":"official","last_updated":"2026-03-24","description":"A large LLM created by combining two fine-tuned Llama 70B models into one 120B model.","context_window":6144,"max_output_tokens":1024,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"structured_output":true,"json_mode":true},"pricing":{"input":3.75,"output":7.5},"parameters":120,"release_date":"2023-11-10","tagline":"A large LLM created by combining two fine-tuned Llama 70B models into one 120B model."},{"id":"amazon/nova-2-lite-v1","name":"Amazon: Nova 2 Lite","created_by":"amazon","source":"official","last_updated":"2026-03-23","description":"Nova 2 Lite is a fast, cost-effective reasoning model for everyday workloads that can process text, images, and videos to generate 
text.","context_window":1000000,"max_output_tokens":65535,"modalities":{"input":["text","image","video"],"output":["text"]},"capabilities":{"tool_call":true,"reasoning":true},"pricing":{"input":0.3,"output":2.5},"model_type":"chat","release_date":"2025-12-02","tagline":"Nova 2 Lite is a fast, cost-effective reasoning model for everyday workloads that can process text, images, and videos to generate text.","tools":["function_calling"]},{"id":"amazon/nova-lite-v1","name":"Amazon: Nova Lite 1.0","created_by":"amazon","source":"official","last_updated":"2026-03-23","description":"Amazon Nova Lite 1.0 is a very low-cost multimodal model from Amazon that focused on fast processing of image, video, and text inputs to generate text output.","context_window":300000,"max_output_tokens":5120,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"tool_call":true},"pricing":{"input":0.06,"output":0.24},"model_type":"chat","release_date":"2024-12-05","tagline":"Amazon Nova Lite 1.0 is a very low-cost multimodal model from Amazon that focused on fast processing of image, video, and text inputs to generate text output.","tools":["function_calling"]},{"id":"amazon/nova-micro-v1","name":"Amazon: Nova Micro 1.0","created_by":"amazon","source":"official","last_updated":"2026-03-23","description":"Amazon Nova Micro 1.0 is a text-only model that delivers the lowest latency responses in the Amazon Nova family of models at a very low cost.","context_window":128000,"max_output_tokens":5120,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true},"pricing":{"input":0.035,"output":0.14},"model_type":"chat","release_date":"2024-12-05","tagline":"Amazon Nova Micro 1.0 is a text-only model that delivers the lowest latency responses in the Amazon Nova family of models at a very low cost.","tools":["function_calling"]},{"id":"amazon/nova-premier-v1","name":"Amazon: Nova Premier 
1.0","created_by":"amazon","source":"official","last_updated":"2026-03-23","description":"Amazon Nova Premier is the most capable of Amazon’s multimodal models for complex reasoning tasks and for use as the best teacher for distilling custom models.","context_window":1000000,"max_output_tokens":32000,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"tool_call":true},"pricing":{"input":2.5,"output":12.5,"cached_input":0.625},"model_type":"chat","release_date":"2025-10-31","tagline":"Amazon Nova Premier is the most capable of Amazon’s multimodal models for complex reasoning tasks and for use as the best teacher for distilling custom models.","tools":["function_calling"]},{"id":"amazon/nova-pro-v1","name":"Amazon: Nova Pro 1.0","created_by":"amazon","source":"official","last_updated":"2026-03-23","description":"Amazon Nova Pro 1.0 is a capable multimodal model from Amazon focused on providing a combination of accuracy, speed, and cost for a wide range of tasks.","context_window":300000,"max_output_tokens":5120,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"tool_call":true},"pricing":{"input":0.8,"output":3.2},"model_type":"chat","release_date":"2024-12-05","tagline":"Amazon Nova Pro 1.0 is a capable multimodal model from Amazon focused on providing a combination of accuracy, speed, and cost for a wide range of tasks.","tools":["function_calling"]},{"id":"anthracite-org/magnum-v4-72b","name":"Magnum v4 72B","created_by":"anthracite-org","source":"official","last_updated":"2026-05-17","description":"This is a series of models designed to replicate the prose quality of the Claude 3 models, specifically Sonnet(https://openrouter.ai/anthropic/claude-3.5-sonnet) and 
Opus(https://openrouter.ai/anthropic/claude-3-opus).","context_window":32768,"max_output_tokens":2048,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"structured_output":true,"json_mode":true},"pricing":{"input":3,"output":5},"parameters":72,"release_date":"2024-10-22","tagline":"This is a series of models designed to replicate the prose quality of the Claude 3 models, specifically Sonnet(https://openrouter.ai/anthropic/claude-3.5-sonnet) and Opus(https://openrouter.ai/anthrop"},{"id":"anthropic/claude-3-haiku","name":"Anthropic: Claude 3 Haiku","created_by":"anthropic","source":"official","last_updated":"2026-03-23","family":"claude-haiku","description":"Claude 3 Haiku is Anthropic's fastest and most compact model for\nnear-instant responsiveness. Quick and accurate targeted performance.\n\nSee the launch announcement and benchmark results [here](https:/","context_window":200000,"max_output_tokens":4096,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"tool_call":true,"streaming":true,"vision":true,"batch":true},"pricing":{"input":0.25,"output":1.25,"cached_input":0.03},"model_type":"chat","release_date":"2024-03-13","tagline":"Claude 3 Haiku is Anthropic's fastest and most compact model for\nnear-instant responsiveness. 
Quick and accurate targeted performance.\n\nSee the launch announcement and benchmark results [here](https:/","tools":["function_calling"],"license":"proprietary","open_weight":false},{"id":"anthropic/claude-3.5-haiku","name":"Anthropic: Claude 3.5 Haiku","created_by":"anthropic","source":"official","last_updated":"2026-03-23","family":"claude-haiku","description":"Claude 3.5 Haiku features offers enhanced capabilities in speed, coding accuracy, and tool use.","context_window":200000,"max_output_tokens":8192,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"tool_call":true},"pricing":{"input":0.8,"output":4,"cached_input":0.08},"model_type":"chat","release_date":"2024-11-04","tagline":"Claude 3.5 Haiku features offers enhanced capabilities in speed, coding accuracy, and tool use.","tools":["function_calling"]},{"id":"anthropic/claude-3.5-sonnet","name":"Anthropic: Claude 3.5 Sonnet","created_by":"anthropic","source":"official","last_updated":"2026-03-23","family":"claude-sonnet","description":"New Claude 3.5 Sonnet delivers better-than-Opus capabilities, faster-than-Sonnet speeds, at the same Sonnet prices.","context_window":200000,"max_output_tokens":8192,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"tool_call":true},"pricing":{"input":6,"output":30,"cached_input":0.6},"model_type":"chat","release_date":"2024-10-22","tagline":"New Claude 3.5 Sonnet delivers better-than-Opus capabilities, faster-than-Sonnet speeds, at the same Sonnet prices.","tools":["function_calling"]},{"id":"anthropic/claude-3.7-sonnet:thinking","name":"Anthropic: Claude 3.7 Sonnet (thinking)","created_by":"anthropic","source":"official","last_updated":"2026-05-06","family":"claude-sonnet","description":"Claude 3.7 Sonnet is an advanced large language model with improved reasoning, coding, and problem-solving 
capabilities.","status":"deprecated","deprecation_date":"2026-05-11","context_window":200000,"max_output_tokens":64000,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"tool_call":true,"reasoning":true},"pricing":{"input":3,"output":15,"cached_input":0.3},"model_type":"chat","release_date":"2025-02-24","tagline":"Claude 3.7 Sonnet is an advanced large language model with improved reasoning, coding, and problem-solving capabilities.","tools":["function_calling"]},{"id":"anthropic/claude-3.7-sonnet","name":"Anthropic: Claude 3.7 Sonnet","created_by":"anthropic","source":"official","last_updated":"2026-05-06","family":"claude-sonnet","description":"Claude 3.7 Sonnet is an advanced large language model with improved reasoning, coding, and problem-solving capabilities.","status":"deprecated","deprecation_date":"2026-05-11","context_window":200000,"max_output_tokens":64000,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"tool_call":true,"reasoning":true},"pricing":{"input":3,"output":15,"cached_input":0.3},"model_type":"chat","release_date":"2025-02-24","tagline":"Claude 3.7 Sonnet is an advanced large language model with improved reasoning, coding, and problem-solving capabilities.","tools":["function_calling"]},{"id":"anthropic/claude-fable-5","name":"Anthropic: Claude Fable 5","created_by":"anthropic","source":"official","family":"claude-fable","description":"Claude Fable 5 is a Mythos-class model from Anthropic, built for autonomous knowledge work and coding.","release_date":"2026-06-09","context_window":1000000,"max_output_tokens":128000,"model_type":"chat","tagline":"Claude Fable 5 is a Mythos-class model from Anthropic, built for autonomous knowledge work and 
coding.","capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"vision":true,"batch":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":10,"output":50,"cached_input":1},"tools":["function_calling"],"last_updated":"2026-06-18","license":"proprietary","open_weight":false},{"id":"anthropic/claude-haiku-4.5","name":"Anthropic: Claude Haiku 4.5","created_by":"anthropic","source":"official","last_updated":"2026-05-14","family":"claude-haiku","description":"Claude Haiku 4.5 is Anthropic’s fastest and most efficient model, delivering near-frontier intelligence at a fraction of the cost and latency of larger Claude models.","context_window":200000,"max_output_tokens":64000,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":1,"output":5,"cached_input":0.1},"model_type":"chat","release_date":"2025-10-15","tagline":"Claude Haiku 4.5 is Anthropic’s fastest and most efficient model, delivering near-frontier intelligence at a fraction of the cost and latency of larger Claude models.","tools":["function_calling"]},{"id":"anthropic/claude-opus-4.1","name":"Anthropic: Claude Opus 4.1","created_by":"anthropic","source":"official","last_updated":"2026-03-24","family":"claude-opus","description":"Claude Opus 4.1 is an updated version of Anthropic’s flagship model, offering improved performance in coding, reasoning, and agentic tasks.","context_window":200000,"max_output_tokens":32000,"modalities":{"input":["image","text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":15,"output":75,"cached_input":1.5},"model_type":"chat","release_date":"2025-08-05","tagline":"Claude Opus 4.1 is an updated version of Anthropic’s flagship model, offering improved performance in coding, reasoning, and agentic 
tasks.","tools":["function_calling"]},{"id":"anthropic/claude-opus-4.5","name":"Anthropic: Claude Opus 4.5","created_by":"anthropic","source":"official","last_updated":"2026-03-24","family":"claude-opus","description":"Claude Opus 4.5 is Anthropic’s frontier reasoning model optimized for complex software engineering, agentic workflows, and long-horizon computer use.","context_window":200000,"max_output_tokens":64000,"modalities":{"input":["image","text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":5,"output":25,"cached_input":0.5},"model_type":"chat","release_date":"2025-11-24","tagline":"Claude Opus 4.5 is Anthropic’s frontier reasoning model optimized for complex software engineering, agentic workflows, and long-horizon computer use.","tools":["function_calling"]},{"id":"anthropic/claude-opus-4.6-fast","name":"Anthropic: Claude Opus 4.6 (Fast)","created_by":"anthropic","source":"official","family":"claude-opus","description":"Fast-mode variant of [Opus 4.6](/anthropic/claude-opus-4.6) - identical capabilities with higher output speed at premium 6x pricing.","release_date":"2026-04-07","context_window":1000000,"max_output_tokens":128000,"model_type":"chat","tagline":"Fast-mode variant of [Opus 4.6](/anthropic/claude-opus-4.6) - identical capabilities with higher output speed at premium 6x pricing.","capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":30,"output":150,"cached_input":3},"tools":["function_calling"],"last_updated":"2026-05-29","status":"deprecated","deprecation_date":"2026-06-29"},{"id":"anthropic/claude-opus-4.6","name":"Anthropic: Claude Opus 4.6","created_by":"anthropic","source":"official","last_updated":"2026-03-24","family":"claude-opus","description":"Opus 4.6 is Anthropic’s strongest model for coding and long-running professional 
tasks.","context_window":1000000,"max_output_tokens":128000,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":5,"output":25,"cached_input":0.5},"model_type":"chat","release_date":"2026-02-04","tagline":"Opus 4.6 is Anthropic’s strongest model for coding and long-running professional tasks.","tools":["function_calling"]},{"id":"anthropic/claude-opus-4.7-fast","name":"Anthropic: Claude Opus 4.7 (Fast)","created_by":"anthropic","source":"official","family":"claude-opus","description":"Fast-mode variant of [Opus 4.7](/anthropic/claude-opus-4.7) - identical capabilities with higher output speed at premium 6x pricing.","release_date":"2026-05-12","context_window":1000000,"max_output_tokens":128000,"model_type":"chat","tagline":"Fast-mode variant of [Opus 4.7](/anthropic/claude-opus-4.7) - identical capabilities with higher output speed at premium 6x pricing.","capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":30,"output":150,"cached_input":3},"tools":["function_calling"],"last_updated":"2026-05-14"},{"id":"anthropic/claude-opus-4.7","name":"Anthropic: Claude Opus 4.7","created_by":"anthropic","source":"official","family":"claude-opus","description":"Opus 4.7 is the next generation of Anthropic's Opus family, built for long-running, asynchronous agents.","release_date":"2026-04-16","context_window":1000000,"max_output_tokens":128000,"model_type":"chat","tagline":"Opus 4.7 is the next generation of Anthropic's Opus family, built for long-running, asynchronous 
agents.","capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":5,"output":25,"cached_input":0.5},"tools":["function_calling"],"last_updated":"2026-04-17"},{"id":"anthropic/claude-opus-4.8-fast","name":"Anthropic: Claude Opus 4.8 (Fast)","created_by":"anthropic","source":"official","family":"claude-opus","description":"Fast-mode variant of [Opus 4.8](/anthropic/claude-opus-4.8) - identical capabilities with higher output speed at 2x pricing relative to regular Opus 4.8.","release_date":"2026-05-27","context_window":1000000,"max_output_tokens":128000,"model_type":"chat","tagline":"Fast-mode variant of [Opus 4.8](/anthropic/claude-opus-4.8) - identical capabilities with higher output speed at 2x pricing relative to regular Opus 4.8.","capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":10,"output":50,"cached_input":1},"tools":["function_calling"],"last_updated":"2026-05-29"},{"id":"anthropic/claude-opus-4.8","name":"Anthropic: Claude Opus 4.8","created_by":"anthropic","source":"official","family":"claude-opus","description":"Claude Opus 4.8 is Anthropic's most capable generally available model in the Opus family.","release_date":"2026-05-27","context_window":1000000,"max_output_tokens":128000,"model_type":"chat","tagline":"Claude Opus 4.8 is Anthropic's most capable generally available model in the Opus family.","capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":5,"output":25,"cached_input":0.5},"tools":["function_calling"],"last_updated":"2026-05-29"},{"id":"anthropic/claude-opus-4","name":"Anthropic: Claude Opus 
4","created_by":"anthropic","source":"official","last_updated":"2026-03-23","family":"claude-opus","description":"Claude Opus 4 is benchmarked as the world’s best coding model, at time of release, bringing sustained performance on complex, long-running tasks and agent workflows.","context_window":200000,"max_output_tokens":32000,"modalities":{"input":["image","text"],"output":["text"]},"capabilities":{"tool_call":true,"reasoning":true},"pricing":{"input":15,"output":75,"cached_input":1.5},"model_type":"chat","release_date":"2025-05-22","tagline":"Claude Opus 4 is benchmarked as the world’s best coding model, at time of release, bringing sustained performance on complex, long-running tasks and agent workflows.","tools":["function_calling"]},{"id":"anthropic/claude-sonnet-4.5","name":"Anthropic: Claude Sonnet 4.5","created_by":"anthropic","source":"official","last_updated":"2026-03-24","family":"claude-sonnet","description":"Claude Sonnet 4.5 is Anthropic’s most advanced Sonnet model to date, optimized for real-world agents and coding workflows.","context_window":1000000,"max_output_tokens":64000,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":3,"output":15,"cached_input":0.3},"model_type":"chat","release_date":"2025-09-29","tagline":"Claude Sonnet 4.5 is Anthropic’s most advanced Sonnet model to date, optimized for real-world agents and coding workflows.","tools":["function_calling"]},{"id":"anthropic/claude-sonnet-4.6","name":"Anthropic: Claude Sonnet 4.6","created_by":"anthropic","source":"official","last_updated":"2026-03-24","family":"claude-sonnet","description":"Sonnet 4.6 is Anthropic's most capable Sonnet-class model yet, with frontier performance across coding, agents, and professional 
work.","context_window":1000000,"max_output_tokens":128000,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":3,"output":15,"cached_input":0.3},"model_type":"chat","release_date":"2026-02-17","tagline":"Sonnet 4.6 is Anthropic's most capable Sonnet-class model yet, with frontier performance across coding, agents, and professional work.","tools":["function_calling"]},{"id":"anthropic/claude-sonnet-4","name":"Anthropic: Claude Sonnet 4","created_by":"anthropic","source":"official","last_updated":"2026-04-12","family":"claude-sonnet","description":"Claude Sonnet 4 significantly enhances the capabilities of its predecessor, Sonnet 3.7, excelling in both coding and reasoning tasks with improved precision and controllability.","context_window":1000000,"max_output_tokens":64000,"modalities":{"input":["image","text"],"output":["text"]},"capabilities":{"tool_call":true,"reasoning":true},"pricing":{"input":3,"output":15,"cached_input":0.3},"model_type":"chat","release_date":"2025-05-22","tagline":"Claude Sonnet 4 significantly enhances the capabilities of its predecessor, Sonnet 3.7, excelling in both coding and reasoning tasks with improved precision and controllability.","tools":["function_calling"]},{"id":"arcee-ai/coder-large","name":"Arcee AI: Coder Large","created_by":"arcee-ai","source":"official","last_updated":"2026-04-07","description":"Coder‑Large is a 32 B‑parameter offspring of Qwen 2.5‑Instruct that has been further trained on permissively‑licensed GitHub, CodeSearchNet and synthetic bug‑fix corpora.","context_window":32768,"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.5,"output":0.8},"release_date":"2025-05-05","tagline":"Coder‑Large is a 32 B‑parameter offspring of Qwen 2.5‑Instruct that has been further trained on permissively‑licensed GitHub, CodeSearchNet and synthetic bug‑fix 
corpora."},{"id":"arcee-ai/maestro-reasoning","name":"Arcee AI: Maestro Reasoning","created_by":"arcee-ai","source":"official","last_updated":"2026-04-07","description":"Maestro Reasoning is Arcee's flagship analysis model: a 32 B‑parameter derivative of Qwen 2.5‑32 B tuned with DPO and chain‑of‑thought RL for step‑by‑step logic.","context_window":131072,"max_output_tokens":32000,"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.9,"output":3.3},"model_type":"reasoning","release_date":"2025-05-05","tagline":"Maestro Reasoning is Arcee's flagship analysis model: a 32 B‑parameter derivative of Qwen 2.5‑32 B tuned with DPO and chain‑of‑thought RL for step‑by‑step logic."},{"id":"arcee-ai/spotlight","name":"Arcee AI: Spotlight","created_by":"arcee-ai","source":"official","last_updated":"2026-04-07","description":"Spotlight is a 7‑billion‑parameter vision‑language model derived from Qwen 2.5‑VL and fine‑tuned by Arcee AI for tight image‑text grounding tasks.","context_window":131072,"max_output_tokens":65537,"modalities":{"input":["image","text"],"output":["text"]},"pricing":{"input":0.18,"output":0.18},"release_date":"2025-05-05","tagline":"Spotlight is a 7‑billion‑parameter vision‑language model derived from Qwen 2.5‑VL and fine‑tuned by Arcee AI for tight image‑text grounding tasks."},{"id":"arcee-ai/trinity-large-preview:free","name":"Arcee AI: Trinity Large Preview (free)","created_by":"arcee-ai","source":"official","last_updated":"2026-04-10","description":"Trinity-Large-Preview is a frontier-scale open-weight language model from Arcee, built as a 400B-parameter sparse Mixture-of-Experts with 13B active parameters per token using 4-of-256 expert routing.","context_window":131000,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true},"release_date":"2026-01-27","tagline":"Trinity-Large-Preview is a frontier-scale open-weight language model from Arcee, built as a 
400B-parameter sparse Mixture-of-Experts with 13B active parameters per token using 4-of-256 expert routing.","tools":["function_calling"],"status":"deprecated","deprecation_date":"2026-04-22"},{"id":"arcee-ai/trinity-large-preview","name":"Arcee AI: Trinity Large Preview","created_by":"arcee-ai","source":"official","description":"Trinity-Large-Preview is a frontier-scale open-weight language model from Arcee, built as a 400B-parameter sparse Mixture-of-Experts with 13B active parameters per token using 4-of-256 expert routing.","release_date":"2026-01-27","context_window":131000,"tagline":"Trinity-Large-Preview is a frontier-scale open-weight language model from Arcee, built as a 400B-parameter sparse Mixture-of-Experts with 13B active parameters per token using 4-of-256 expert routing.","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.15,"output":0.45},"tools":["function_calling"],"last_updated":"2026-04-24"},{"id":"arcee-ai/trinity-large-thinking:free","name":"Arcee AI: Trinity Large Thinking (free)","created_by":"arcee-ai","source":"official","description":"Trinity Large Thinking is a powerful open source reasoning model from the team at Arcee AI.","release_date":"2026-04-01","context_window":262144,"max_output_tokens":80000,"tagline":"Trinity Large Thinking is a powerful open source reasoning model from the team at Arcee AI.","capabilities":{"tool_call":true,"reasoning":true},"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-05-14"},{"id":"arcee-ai/trinity-large-thinking","name":"Arcee AI: Trinity Large Thinking","created_by":"arcee-ai","source":"official","description":"Trinity Large Thinking is a powerful open source reasoning model from the team at Arcee AI.","release_date":"2026-04-01","context_window":262144,"max_output_tokens":80000,"tagline":"Trinity Large Thinking is a powerful open source reasoning model 
from the team at Arcee AI.","capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.25,"output":0.8,"cached_input":0.06},"tools":["function_calling"],"last_updated":"2026-06-29"},{"id":"arcee-ai/trinity-mini:free","name":"Arcee AI: Trinity Mini (free)","created_by":"arcee-ai","source":"official","last_updated":"2026-04-03","description":"Trinity Mini is a 26B-parameter (3B active) sparse mixture-of-experts language model featuring 128 experts with 8 active per token.","context_window":131072,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"release_date":"2025-12-01","tagline":"Trinity Mini is a 26B-parameter (3B active) sparse mixture-of-experts language model featuring 128 experts with 8 active per token.","tools":["function_calling"],"status":"deprecated","deprecation_date":"2026-04-10"},{"id":"arcee-ai/trinity-mini","name":"Arcee AI: Trinity Mini","created_by":"arcee-ai","source":"official","last_updated":"2026-03-24","description":"Trinity Mini is a 26B-parameter (3B active) sparse mixture-of-experts language model featuring 128 experts with 8 active per token.","context_window":131072,"max_output_tokens":131072,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":0.045,"output":0.15},"release_date":"2025-12-01","tagline":"Trinity Mini is a 26B-parameter (3B active) sparse mixture-of-experts language model featuring 128 experts with 8 active per token.","tools":["function_calling"]},{"id":"arcee-ai/virtuoso-large","name":"Arcee AI: Virtuoso Large","created_by":"arcee-ai","source":"official","last_updated":"2026-04-07","description":"Virtuoso‑Large is Arcee's top‑tier general‑purpose LLM at 72 B parameters, tuned to tackle cross‑domain reasoning, creative 
writing and enterprise QA.","context_window":131072,"max_output_tokens":64000,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true},"pricing":{"input":0.75,"output":1.2},"release_date":"2025-05-05","tagline":"Virtuoso‑Large is Arcee's top‑tier general‑purpose LLM at 72 B parameters, tuned to tackle cross‑domain reasoning, creative writing and enterprise QA.","tools":["function_calling"]},{"id":"baidu/cobuddy:free","name":"Baidu Qianfan: CoBuddy (free)","created_by":"baidu","source":"official","description":"CoBuddy is a code generation model from Baidu, optimized for coding tasks and AI Agent workflows.","release_date":"2026-05-06","context_window":131072,"max_output_tokens":65536,"tagline":"CoBuddy is a code generation model from Baidu, optimized for coding tasks and AI Agent workflows.","capabilities":{"tool_call":true,"reasoning":true},"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-05-06"},{"id":"baidu/ernie-4.5-21b-a3b-thinking","name":"Baidu: ERNIE 4.5 21B A3B Thinking","created_by":"baidu","source":"official","last_updated":"2026-03-23","description":"ERNIE-4.5-21B-A3B-Thinking is Baidu's upgraded lightweight MoE model, refined to boost reasoning depth and quality for top-tier performance in logical puzzles, math, science, coding, text generation, ","context_window":131072,"max_output_tokens":65536,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"reasoning":true},"pricing":{"input":0.07,"output":0.28},"parameters":21,"active_parameters":3,"release_date":"2025-10-09","tagline":"ERNIE-4.5-21B-A3B-Thinking is Baidu's upgraded lightweight MoE model, refined to boost reasoning depth and quality for top-tier performance in logical puzzles, math, science, coding, text generation, "},{"id":"baidu/ernie-4.5-21b-a3b","name":"Baidu: ERNIE 4.5 21B A3B","created_by":"baidu","source":"official","last_updated":"2026-05-17","description":"A sophisticated text-based 
Mixture-of-Experts (MoE) model featuring 21B total parameters with 3B activated per token, delivering exceptional multimodal understanding and generation through heterogeneous MoE structures and modality-isolated routing.","context_window":131072,"max_output_tokens":8000,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true},"pricing":{"input":0.07,"output":0.28},"parameters":21,"active_parameters":3,"release_date":"2025-08-12","tagline":"A sophisticated text-based Mixture-of-Experts (MoE) model featuring 21B total parameters with 3B activated per token, delivering exceptional multimodal understanding and generation through heterogeneo","tools":["function_calling"]},{"id":"baidu/ernie-4.5-300b-a47b","name":"Baidu: ERNIE 4.5 300B A47B ","created_by":"baidu","source":"official","last_updated":"2026-05-17","description":"ERNIE-4.5-300B-A47B is a 300B parameter Mixture-of-Experts (MoE) language model developed by Baidu as part of the ERNIE 4.5 series.","context_window":131072,"max_output_tokens":12000,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"structured_output":true,"json_mode":true},"pricing":{"input":0.28,"output":1.1},"parameters":300,"active_parameters":47,"release_date":"2025-06-30","tagline":"ERNIE-4.5-300B-A47B is a 300B parameter Mixture-of-Experts (MoE) language model developed by Baidu as part of the ERNIE 4.5 series."},{"id":"baidu/ernie-4.5-vl-28b-a3b","name":"Baidu: ERNIE 4.5 VL 28B A3B","created_by":"baidu","source":"official","last_updated":"2026-05-17","description":"A powerful multimodal Mixture-of-Experts chat model featuring 28B total parameters with 3B activated per token, delivering exceptional text and vision understanding through its innovative 
heterogeneou","context_window":131072,"max_output_tokens":8000,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"tool_call":true,"reasoning":true},"pricing":{"input":0.14,"output":0.56},"parameters":28,"active_parameters":3,"release_date":"2025-08-12","tagline":"A powerful multimodal Mixture-of-Experts chat model featuring 28B total parameters with 3B activated per token, delivering exceptional text and vision understanding through its innovative heterogeneou","tools":["function_calling"]},{"id":"baidu/ernie-4.5-vl-424b-a47b","name":"Baidu: ERNIE 4.5 VL 424B A47B ","created_by":"baidu","source":"official","last_updated":"2026-05-17","description":"ERNIE-4.5-VL-424B-A47B is a multimodal Mixture-of-Experts (MoE) model from Baidu’s ERNIE 4.5 series, featuring 424B total parameters with 47B active per token.","context_window":131072,"max_output_tokens":16000,"modalities":{"input":["image","text"],"output":["text"]},"capabilities":{"reasoning":true},"pricing":{"input":0.42,"output":1.25},"parameters":424,"active_parameters":47,"release_date":"2025-06-30","tagline":"ERNIE-4.5-VL-424B-A47B is a multimodal Mixture-of-Experts (MoE) model from Baidu’s ERNIE 4.5 series, featuring 424B total parameters with 47B active per token."},{"id":"baidu/qianfan-ocr-fast:free","name":"Baidu: Qianfan-OCR-Fast (free)","created_by":"baidu","source":"official","description":"Qianfan-OCR-Fast is a domain-specific multimodal large model purpose-built for OCR.","release_date":"2026-04-20","context_window":65536,"max_output_tokens":28672,"tagline":"Qianfan-OCR-Fast is a domain-specific multimodal large model purpose-built for OCR.","capabilities":{"reasoning":true},"modalities":{"input":["image","text"],"output":["text"]},"last_updated":"2026-04-24"},{"id":"baidu/qianfan-ocr-fast","name":"Baidu: Qianfan-OCR-Fast","created_by":"baidu","source":"official","description":"Qianfan-OCR-Fast is a domain-specific multimodal large model purpose-built for 
OCR.","release_date":"2026-04-20","context_window":65536,"max_output_tokens":28672,"tagline":"Qianfan-OCR-Fast is a domain-specific multimodal large model purpose-built for OCR.","capabilities":{"reasoning":true},"modalities":{"input":["image","text"],"output":["text"]},"pricing":{"input":0.68,"output":2.81},"last_updated":"2026-05-23","status":"deprecated","deprecation_date":"2026-05-28"},{"id":"bytedance-seed/seed-1.6-flash","name":"ByteDance Seed: Seed 1.6 Flash","created_by":"bytedance-seed","source":"official","last_updated":"2026-03-24","description":"Seed 1.6 Flash is an ultra-fast multimodal deep thinking model by ByteDance Seed, supporting both text and visual understanding.","context_window":262144,"max_output_tokens":32768,"modalities":{"input":["image","text","video"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":0.075,"output":0.3},"release_date":"2025-12-23","tagline":"Seed 1.6 Flash is an ultra-fast multimodal deep thinking model by ByteDance Seed, supporting both text and visual understanding.","tools":["function_calling"]},{"id":"bytedance-seed/seed-1.6","name":"ByteDance Seed: Seed 1.6","created_by":"bytedance-seed","source":"official","last_updated":"2026-03-24","description":"Seed 1.6 is a general-purpose model released by the ByteDance Seed team.","context_window":262144,"max_output_tokens":32768,"modalities":{"input":["image","text","video"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":0.25,"output":2},"release_date":"2025-12-23","tagline":"Seed 1.6 is a general-purpose model released by the ByteDance Seed team.","tools":["function_calling"]},{"id":"bytedance-seed/seed-2.0-lite","name":"ByteDance Seed: Seed-2.0-Lite","created_by":"bytedance-seed","source":"official","last_updated":"2026-04-07","description":"Seed-2.0-Lite is a versatile, cost‑efficient enterprise workhorse 
that delivers strong multimodal and agent capabilities while offering noticeably lower latency, making it a practical default choice f","context_window":262144,"max_output_tokens":131072,"modalities":{"input":["text","image","video"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":0.25,"output":2},"release_date":"2026-03-10","tagline":"Seed-2.0-Lite is a versatile, cost‑efficient enterprise workhorse that delivers strong multimodal and agent capabilities while offering noticeably lower latency, making it a practical default choice f","tools":["function_calling"]},{"id":"bytedance-seed/seed-2.0-mini","name":"ByteDance Seed: Seed-2.0-Mini","created_by":"bytedance-seed","source":"official","last_updated":"2026-03-24","description":"Seed-2.0-mini targets latency-sensitive, high-concurrency, and cost-sensitive scenarios, emphasizing fast response and flexible inference deployment.","context_window":262144,"max_output_tokens":131072,"modalities":{"input":["text","image","video"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":0.1,"output":0.4},"release_date":"2026-02-26","tagline":"Seed-2.0-mini targets latency-sensitive, high-concurrency, and cost-sensitive scenarios, emphasizing fast response and flexible inference deployment.","tools":["function_calling"]},{"id":"bytedance/ui-tars-1.5-7b","name":"ByteDance: UI-TARS 7B ","created_by":"bytedance","source":"official","last_updated":"2026-06-18","description":"UI-TARS-1.5 is a multimodal vision-language agent optimized for GUI-based environments, including desktop interfaces, web browsers, mobile systems, and games.","context_window":128000,"max_output_tokens":2048,"modalities":{"input":["image","text"],"output":["text"]},"pricing":{"input":0.1,"output":0.2,"cached_input":0.1},"parameters":7,"release_date":"2025-07-22","tagline":"UI-TARS-1.5 is a multimodal 
vision-language agent optimized for GUI-based environments, including desktop interfaces, web browsers, mobile systems, and games.","capabilities":{"structured_output":true,"json_mode":true}},{"id":"cognitivecomputations/dolphin-mistral-24b-venice-edition:free","name":"Venice: Uncensored (free)","created_by":"cognitivecomputations","source":"official","last_updated":"2026-03-24","description":"Venice Uncensored Dolphin Mistral 24B Venice Edition is a fine-tuned variant of Mistral-Small-24B-Instruct-2501, developed by dphn.ai in collaboration with Venice.ai.","context_window":32768,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"structured_output":true,"json_mode":true},"parameters":24,"release_date":"2025-07-09","tagline":"Venice Uncensored Dolphin Mistral 24B Venice Edition is a fine-tuned variant of Mistral-Small-24B-Instruct-2501, developed by dphn.ai in collaboration with Venice.ai."},{"id":"cohere/command-a","name":"Cohere: Command A","created_by":"cohere","source":"official","last_updated":"2026-03-24","description":"Command A is an open-weights 111B parameter model with a 256k context window focused on delivering great performance across agentic, multilingual, and coding use cases.","context_window":256000,"max_output_tokens":8192,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"structured_output":true,"json_mode":true},"pricing":{"input":2.5,"output":10},"family":"command-a","model_type":"chat","release_date":"2025-03-13","tagline":"Command A is an open-weights 111B parameter model with a 256k context window focused on delivering great performance across agentic, multilingual, and coding use cases."},{"id":"cohere/command-r-08-2024","name":"Cohere: Command R (08-2024)","created_by":"cohere","source":"official","last_updated":"2026-03-24","description":"command-r-08-2024 is an update of the [Command R](/models/cohere/command-r) with improved performance for multilingual retrieval-augmented generation (RAG) and tool 
use.","context_window":128000,"max_output_tokens":4000,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"fine_tuning":true},"pricing":{"input":0.15,"output":0.6},"family":"command-r","model_type":"chat","release_date":"2024-08-30","tagline":"command-r-08-2024 is an update of the [Command R](/models/cohere/command-r) with improved performance for multilingual retrieval-augmented generation (RAG) and tool use.","tools":["function_calling"],"license":"cc-by-nc-4.0","open_weight":true},{"id":"cohere/command-r-plus-08-2024","name":"Cohere: Command R+ (08-2024)","created_by":"cohere","source":"official","last_updated":"2026-04-07","description":"command-r-plus-08-2024 is an update of the [Command R+](/models/cohere/command-r-plus) with roughly 50% higher throughput and 25% lower latencies as compared to the previous Command R+ version, while ","context_window":128000,"max_output_tokens":4000,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"fine_tuning":true},"pricing":{"input":2.5,"output":10},"family":"command-r-plus","model_type":"chat","release_date":"2024-08-30","tagline":"command-r-plus-08-2024 is an update of the [Command R+](/models/cohere/command-r-plus) with roughly 50% higher throughput and 25% lower latencies as compared to the previous Command R+ version, while ","tools":["function_calling"],"license":"cc-by-nc-4.0","open_weight":true},{"id":"cohere/command-r7b-12-2024","name":"Cohere: Command R7B (12-2024)","created_by":"cohere","source":"official","last_updated":"2026-03-24","description":"Command R7B (12-2024) is a small, fast update of the Command R+ model, delivered in December 
2024.","context_window":128000,"max_output_tokens":4000,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"structured_output":true,"json_mode":true,"streaming":true,"tool_call":true,"reasoning":true,"fine_tuning":true},"pricing":{"input":0.038,"output":0.15},"family":"command-r","model_type":"chat","release_date":"2024-12-14","tagline":"Command R7B (12-2024) is a small, fast update of the Command R+ model, delivered in December 2024.","license":"cc-by-nc-4.0","open_weight":true},{"id":"cohere/north-mini-code:free","name":"Cohere: North Mini Code (free)","created_by":"cohere","source":"official","description":"North Mini Code is Cohere's first agentic coding model and the debut of its North family.","release_date":"2026-06-17","context_window":256000,"max_output_tokens":64000,"tagline":"North Mini Code is Cohere's first agentic coding model and the debut of its North family.","capabilities":{"tool_call":true,"reasoning":true},"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-06-18"},{"id":"deepcogito/cogito-v2.1-671b","name":"Deep Cogito: Cogito v2.1 671B","created_by":"deepcogito","source":"official","last_updated":"2026-03-24","description":"Cogito v2.1 671B MoE represents one of the strongest open models globally, matching performance of frontier closed and open models.","context_window":128000,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":1.25,"output":1.25},"parameters":671,"release_date":"2025-11-13","tagline":"Cogito v2.1 671B MoE represents one of the strongest open models globally, matching performance of frontier closed and open models.","model_type":"chat"},{"id":"deepseek/deepseek-chat-v3-0324","name":"DeepSeek: DeepSeek V3 0324","created_by":"deepseek","source":"official","last_updated":"2026-04-25","family":"deepseek-chat","description":"DeepSeek V3, a 685B-parameter, mixture-of-experts 
model, is the latest iteration of the flagship chat model family from the DeepSeek team.","context_window":163840,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":0.2,"output":0.77,"cached_input":0.135},"release_date":"2025-03-24","tagline":"DeepSeek V3, a 685B-parameter, mixture-of-experts model, is the latest iteration of the flagship chat model family from the DeepSeek team.","tools":["function_calling"],"model_type":"chat","max_output_tokens":16384},{"id":"deepseek/deepseek-chat-v3.1","name":"DeepSeek: DeepSeek V3.1","created_by":"deepseek","source":"official","last_updated":"2026-05-14","family":"deepseek-chat","description":"DeepSeek-V3.1 is a large hybrid reasoning model (671B parameters, 37B active) that supports both thinking and non-thinking modes via prompt templates.","context_window":163840,"max_output_tokens":32768,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":0.21,"output":0.79,"cached_input":0.13},"release_date":"2025-08-21","tagline":"DeepSeek-V3.1 is a large hybrid reasoning model (671B parameters, 37B active) that supports both thinking and non-thinking modes via prompt templates.","tools":["function_calling"],"model_type":"chat"},{"id":"deepseek/deepseek-chat","name":"DeepSeek: DeepSeek V3","created_by":"deepseek","source":"official","last_updated":"2026-06-02","family":"deepseek-chat","description":"DeepSeek-V3 is the latest model from the DeepSeek team, building upon the instruction following and coding abilities of the previous 
versions.","context_window":131072,"max_output_tokens":16000,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"fine_tuning":true},"pricing":{"input":0.2,"output":0.8},"release_date":"2024-12-26","tagline":"DeepSeek-V3 is the latest model from the DeepSeek team, building upon the instruction following and coding abilities of the previous versions.","tools":["function_calling"],"model_type":"chat","license":"mit","open_weight":true},{"id":"deepseek/deepseek-r1-0528","name":"DeepSeek: R1 0528","created_by":"deepseek","source":"official","last_updated":"2026-04-25","family":"deepseek-r1","description":"May 28th update to the [original DeepSeek R1](/deepseek/deepseek-r1) Performance on par with [OpenAI o1](/openai/o1), but open-sourced and with fully open reasoning tokens.","context_window":163840,"max_output_tokens":32768,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":0.5,"output":2.15,"cached_input":0.35},"model_type":"reasoning","release_date":"2025-05-28","tagline":"May 28th update to the [original DeepSeek R1](/deepseek/deepseek-r1) Performance on par with [OpenAI o1](/openai/o1), but open-sourced and with fully open reasoning tokens.","tools":["function_calling"]},{"id":"deepseek/deepseek-r1-distill-llama-70b","name":"DeepSeek: R1 Distill Llama 70B","created_by":"deepseek","source":"official","last_updated":"2026-06-18","family":"deepseek-r1","description":"DeepSeek R1 Distill Llama 70B is a distilled large language model based on [Llama-3.3-70B-Instruct](/meta-llama/llama-3.3-70b-instruct), using outputs from [DeepSeek 
R1](/deepseek/deepseek-r1).","context_window":128000,"max_output_tokens":8192,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":0.8,"output":0.8},"model_type":"reasoning","parameters":70,"release_date":"2025-01-23","tagline":"DeepSeek R1 Distill Llama 70B is a distilled large language model based on [Llama-3.3-70B-Instruct](/meta-llama/llama-3.3-70b-instruct), using outputs from [DeepSeek R1](/deepseek/deepseek-r1).","status":"deprecated","deprecation_date":"2026-06-11"},{"id":"deepseek/deepseek-r1-distill-qwen-32b","name":"DeepSeek: R1 Distill Qwen 32B","created_by":"deepseek","source":"official","last_updated":"2026-05-17","family":"deepseek-r1","description":"DeepSeek R1 Distill Qwen 32B is a distilled large language model based on [Qwen 2.5 32B](https://huggingface.co/Qwen/Qwen2.5-32B), using outputs from [DeepSeek R1](/deepseek/deepseek-r1).","context_window":128000,"max_output_tokens":32768,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":0.29,"output":0.29},"model_type":"reasoning","parameters":32,"release_date":"2025-01-29","tagline":"DeepSeek R1 Distill Qwen 32B is a distilled large language model based on [Qwen 2.5 32B](https://huggingface.co/Qwen/Qwen2.5-32B), using outputs from [DeepSeek R1](/deepseek/deepseek-r1)."},{"id":"deepseek/deepseek-r1","name":"DeepSeek: R1","created_by":"deepseek","source":"official","last_updated":"2026-05-17","family":"deepseek-r1","description":"DeepSeek R1 is here: Performance on par with [OpenAI o1](/openai/o1), but open-sourced and with fully open reasoning 
tokens.","context_window":163840,"max_output_tokens":16000,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"reasoning":true,"structured_output":true,"json_mode":true},"pricing":{"input":0.7,"output":2.5},"model_type":"reasoning","release_date":"2025-01-20","tagline":"DeepSeek R1 is here: Performance on par with [OpenAI o1](/openai/o1), but open-sourced and with fully open reasoning tokens.","tools":["function_calling"]},{"id":"deepseek/deepseek-v3.1-terminus","name":"DeepSeek: DeepSeek V3.1 Terminus","created_by":"deepseek","source":"official","last_updated":"2026-05-06","family":"deepseek","description":"DeepSeek-V3.1 Terminus is an update to [DeepSeek V3.1](/deepseek/deepseek-chat-v3.1) that maintains the model's original capabilities while addressing issues reported by users, including language cons","context_window":163840,"max_output_tokens":32768,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":0.27,"output":0.95,"cached_input":0.13},"release_date":"2025-09-22","tagline":"DeepSeek-V3.1 Terminus is an update to [DeepSeek V3.1](/deepseek/deepseek-chat-v3.1) that maintains the model's original capabilities while addressing issues reported by users, including language cons","tools":["function_calling"],"model_type":"chat"},{"id":"deepseek/deepseek-v3.2-exp","name":"DeepSeek: DeepSeek V3.2 Exp","created_by":"deepseek","source":"official","last_updated":"2026-03-24","family":"deepseek","description":"DeepSeek-V3.2-Exp is an experimental large language model released by DeepSeek as an intermediate step between V3.1 and future 
architectures.","context_window":163840,"max_output_tokens":65536,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":0.27,"output":0.41},"release_date":"2025-09-29","tagline":"DeepSeek-V3.2-Exp is an experimental large language model released by DeepSeek as an intermediate step between V3.1 and future architectures.","tools":["function_calling"],"model_type":"chat"},{"id":"deepseek/deepseek-v3.2-speciale","name":"DeepSeek: DeepSeek V3.2 Speciale","created_by":"deepseek","source":"official","last_updated":"2026-05-07","family":"deepseek","description":"DeepSeek-V3.2-Speciale is a high-compute variant of DeepSeek-V3.2 optimized for maximum reasoning and agentic performance.","context_window":163840,"max_output_tokens":163840,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":0.287,"output":0.431,"cached_input":0.058},"release_date":"2025-12-01","tagline":"DeepSeek-V3.2-Speciale is a high-compute variant of DeepSeek-V3.2 optimized for maximum reasoning and agentic performance.","model_type":"chat"},{"id":"deepseek/deepseek-v3.2","name":"DeepSeek: DeepSeek V3.2","created_by":"deepseek","source":"official","last_updated":"2026-06-29","family":"deepseek","description":"DeepSeek-V3.2 is a large language model designed to harmonize high computational efficiency with strong reasoning and agentic tool-use performance.","context_window":131072,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":0.229,"output":0.343,"cached_input":0.023},"release_date":"2025-12-01","tagline":"DeepSeek-V3.2 is a large language model designed to harmonize high computational efficiency with strong reasoning and agentic tool-use 
performance.","tools":["function_calling"],"model_type":"chat","max_output_tokens":64000},{"id":"deepseek/deepseek-v4-flash:free","name":"DeepSeek: DeepSeek V4 Flash (free)","created_by":"deepseek","source":"official","family":"deepseek","description":"DeepSeek V4 Flash is an efficiency-optimized Mixture-of-Experts model from DeepSeek with 284B total parameters and 13B activated parameters, supporting a 1M-token context window.","release_date":"2026-04-24","context_window":1048576,"max_output_tokens":384000,"model_type":"chat","tagline":"DeepSeek V4 Flash is an efficiency-optimized Mixture-of-Experts model from DeepSeek with 284B total parameters and 13B activated parameters, supporting a 1M-token context window.","capabilities":{"tool_call":true,"reasoning":true},"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-05-17"},{"id":"deepseek/deepseek-v4-flash","name":"DeepSeek: DeepSeek V4 Flash","created_by":"deepseek","source":"official","family":"deepseek","description":"DeepSeek V4 Flash is an efficiency-optimized Mixture-of-Experts model from DeepSeek with 284B total parameters and 13B activated parameters, supporting a 1M-token context window.","release_date":"2026-04-24","context_window":1048576,"max_output_tokens":65536,"model_type":"chat","tagline":"DeepSeek V4 Flash is an efficiency-optimized Mixture-of-Experts model from DeepSeek with 284B total parameters and 13B activated parameters, supporting a 1M-token context window.","capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.09,"output":0.18,"cached_input":0.02},"tools":["function_calling"],"last_updated":"2026-06-18","license":"mit","open_weight":true},{"id":"deepseek/deepseek-v4-pro","name":"DeepSeek: DeepSeek V4 Pro","created_by":"deepseek","source":"official","family":"deepseek","description":"DeepSeek V4 Pro 
is a large-scale Mixture-of-Experts model from DeepSeek with 1.6T total parameters and 49B activated parameters, supporting a 1M-token context window.","release_date":"2026-04-24","context_window":1048576,"max_output_tokens":384000,"model_type":"chat","tagline":"DeepSeek V4 Pro is a large-scale Mixture-of-Experts model from DeepSeek with 1.6T total parameters and 49B activated parameters, supporting a 1M-token context window.","capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.435,"output":0.87,"cached_input":0.004},"tools":["function_calling"],"last_updated":"2026-04-26","license":"mit","open_weight":true},{"id":"eleutherai/llemma_7b","name":"EleutherAI: Llemma 7b","created_by":"eleutherai","source":"official","last_updated":"2026-03-23","description":"Llemma 7B is a language model for mathematics.","context_window":4096,"max_output_tokens":4096,"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.8,"output":1.2},"parameters":7,"release_date":"2025-04-14","tagline":"Llemma 7B is a language model for mathematics."},{"id":"essentialai/rnj-1-instruct","name":"EssentialAI: Rnj 1 Instruct","created_by":"essentialai","source":"official","last_updated":"2026-03-24","description":"Rnj-1 is an 8B-parameter, dense, open-weight model family developed by Essential AI and trained from scratch with a focus on programming, math, and scientific reasoning.","context_window":32768,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true},"pricing":{"input":0.15,"output":0.15},"release_date":"2025-12-07","tagline":"Rnj-1 is an 8B-parameter, dense, open-weight model family developed by Essential AI and trained from scratch with a focus on programming, math, and scientific 
reasoning.","tools":["function_calling"],"model_type":"chat"},{"id":"google/gemini-2.0-flash-001","name":"Google: Gemini 2.0 Flash","created_by":"google","source":"official","last_updated":"2026-05-23","family":"gemini-2.0","description":"Gemini Flash 2.0 offers a significantly faster time to first token (TTFT) compared to [Gemini Flash 1.5](/google/gemini-flash-1.5), while maintaining quality on par with larger models like [Gemini Pro 1.5](/google/gemini-pro-1.5).","status":"deprecated","deprecation_date":"2026-06-01","context_window":1000000,"max_output_tokens":8192,"modalities":{"input":["text","image","audio","video"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"vision":true},"pricing":{"input":0.1,"output":0.4,"cached_input":0.025},"model_type":"chat","release_date":"2025-02-05","tagline":"Gemini Flash 2.0 offers a significantly faster time to first token (TTFT) compared to [Gemini Flash 1.5](/google/gemini-flash-1.5), while maintaining quality on par with larger models like [Gemini Pro","tools":["function_calling"],"license":"proprietary","open_weight":false},{"id":"google/gemini-2.0-flash-lite-001","name":"Google: Gemini 2.0 Flash Lite","created_by":"google","source":"official","last_updated":"2026-03-24","family":"gemini-2.0","description":"Gemini 2.0 Flash Lite offers a significantly faster time to first token (TTFT) compared to [Gemini Flash 1.5](/google/gemini-flash-1.5), while maintaining quality on par with larger models like [Gemin","status":"deprecated","deprecation_date":"2026-06-01","context_window":1048576,"max_output_tokens":8192,"modalities":{"input":["text","image","audio","video"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"vision":true},"pricing":{"input":0.075,"output":0.3},"model_type":"chat","release_date":"2025-02-25","tagline":"Gemini 2.0 Flash Lite offers a significantly faster time to first token (TTFT) 
compared to [Gemini Flash 1.5](/google/gemini-flash-1.5), while maintaining quality on par with larger models like [Gemin","tools":["function_calling"],"license":"proprietary","open_weight":false},{"id":"google/gemini-2.5-flash-image","name":"Google: Nano Banana (Gemini 2.5 Flash Image)","created_by":"google","source":"official","last_updated":"2026-06-29","family":"gemini-2.5","description":"Gemini 2.5 Flash Image, a.k.a.","context_window":32768,"max_output_tokens":32768,"modalities":{"input":["image","text"],"output":["image","text"]},"capabilities":{"structured_output":true,"json_mode":true,"streaming":true,"tool_call":true,"reasoning":true,"batch":true,"vision":true},"pricing":{"input":0.3,"output":2.5,"cached_input":0.03},"model_type":"chat","release_date":"2025-10-07","tagline":"Gemini 2.5 Flash Image, a.k.a.","knowledge_cutoff":"2025-06","license":"proprietary","open_weight":false},{"id":"google/gemini-2.5-flash-lite-preview-09-2025","name":"Google: Gemini 2.5 Flash Lite Preview 09-2025","created_by":"google","source":"official","last_updated":"2026-04-03","family":"gemini-2.5","description":"Gemini 2.5 Flash-Lite is a lightweight reasoning model in the Gemini 2.5 family, optimized for ultra-low latency and cost efficiency.","context_window":1048576,"max_output_tokens":65535,"modalities":{"input":["text","image","audio","video"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"batch":true,"vision":true},"pricing":{"input":0.1,"output":0.4,"cached_input":0.01},"model_type":"chat","release_date":"2025-09-25","tagline":"Gemini 2.5 Flash-Lite is a lightweight reasoning model in the Gemini 2.5 family, optimized for ultra-low latency and cost efficiency.","tools":["function_calling"],"knowledge_cutoff":"2025-01","license":"proprietary","open_weight":false},{"id":"google/gemini-2.5-flash-lite","name":"Google: Gemini 2.5 Flash 
Lite","created_by":"google","source":"official","last_updated":"2026-03-24","family":"gemini-2.5","description":"Gemini 2.5 Flash-Lite is a lightweight reasoning model in the Gemini 2.5 family, optimized for ultra-low latency and cost efficiency.","context_window":1048576,"max_output_tokens":65535,"modalities":{"input":["text","image","audio","video"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"batch":true,"vision":true},"pricing":{"input":0.1,"output":0.4,"cached_input":0.01},"model_type":"chat","release_date":"2025-07-22","tagline":"Gemini 2.5 Flash-Lite is a lightweight reasoning model in the Gemini 2.5 family, optimized for ultra-low latency and cost efficiency.","tools":["function_calling"],"knowledge_cutoff":"2025-01","license":"proprietary","open_weight":false},{"id":"google/gemini-2.5-flash","name":"Google: Gemini 2.5 Flash","created_by":"google","source":"official","last_updated":"2026-03-24","family":"gemini-2.5","description":"Gemini 2.5 Flash is Google's state-of-the-art workhorse model, specifically designed for advanced reasoning, coding, mathematics, and scientific tasks.","context_window":1048576,"max_output_tokens":65535,"modalities":{"input":["image","text","audio","video"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"batch":true,"vision":true},"pricing":{"input":0.3,"output":2.5,"cached_input":0.03},"model_type":"chat","release_date":"2025-06-17","tagline":"Gemini 2.5 Flash is Google's state-of-the-art workhorse model, specifically designed for advanced reasoning, coding, mathematics, and scientific tasks.","tools":["function_calling"],"knowledge_cutoff":"2025-01","license":"proprietary","open_weight":false},{"id":"google/gemini-2.5-pro-preview-05-06","name":"Google: Gemini 2.5 Pro Preview 
05-06","created_by":"google","source":"official","last_updated":"2026-03-24","family":"gemini-2.5","description":"Gemini 2.5 Pro is Google’s state-of-the-art AI model designed for advanced reasoning, coding, mathematics, and scientific tasks.","context_window":1048576,"max_output_tokens":65535,"modalities":{"input":["text","image","audio","video"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"vision":true},"pricing":{"input":1.25,"output":10,"cached_input":0.125},"model_type":"chat","release_date":"2025-05-07","tagline":"Gemini 2.5 Pro is Google’s state-of-the-art AI model designed for advanced reasoning, coding, mathematics, and scientific tasks.","tools":["function_calling"],"license":"proprietary","open_weight":false},{"id":"google/gemini-2.5-pro-preview","name":"Google: Gemini 2.5 Pro Preview 06-05","created_by":"google","source":"official","last_updated":"2026-03-24","family":"gemini-2.5","description":"Gemini 2.5 Pro is Google’s state-of-the-art AI model designed for advanced reasoning, coding, mathematics, and scientific tasks.","context_window":1048576,"max_output_tokens":65536,"modalities":{"input":["image","text","audio"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":1.25,"output":10,"cached_input":0.125},"model_type":"chat","release_date":"2025-06-05","tagline":"Gemini 2.5 Pro is Google’s state-of-the-art AI model designed for advanced reasoning, coding, mathematics, and scientific tasks.","tools":["function_calling"]},{"id":"google/gemini-2.5-pro","name":"Google: Gemini 2.5 Pro","created_by":"google","source":"official","last_updated":"2026-03-24","family":"gemini-2.5","description":"Gemini 2.5 Pro is Google’s state-of-the-art AI model designed for advanced reasoning, coding, mathematics, and scientific 
tasks.","context_window":1048576,"max_output_tokens":65536,"modalities":{"input":["text","image","audio","video"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"batch":true,"vision":true},"pricing":{"input":1.25,"output":10,"cached_input":0.125},"model_type":"chat","release_date":"2025-06-17","tagline":"Gemini 2.5 Pro is Google’s state-of-the-art AI model designed for advanced reasoning, coding, mathematics, and scientific tasks.","tools":["function_calling"],"knowledge_cutoff":"2025-01","license":"proprietary","open_weight":false},{"id":"google/gemini-3-flash-preview","name":"Google: Gemini 3 Flash Preview","created_by":"google","source":"official","last_updated":"2026-06-18","family":"gemini-3","description":"Gemini 3 Flash Preview is a high speed, high value thinking model designed for agentic workflows, multi turn chat, and coding assistance.","context_window":1048576,"max_output_tokens":65535,"modalities":{"input":["text","image","audio","video"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"batch":true,"vision":true},"pricing":{"input":0.5,"output":3,"cached_input":0.05},"model_type":"chat","release_date":"2025-12-17","tagline":"Gemini 3 Flash Preview is a high speed, high value thinking model designed for agentic workflows, multi turn chat, and coding assistance.","tools":["function_calling"],"knowledge_cutoff":"2025-01","license":"proprietary","open_weight":false},{"id":"google/gemini-3-pro-image-preview","name":"Google: Nano Banana Pro (Gemini 3 Pro Image Preview)","created_by":"google","source":"official","last_updated":"2026-03-24","family":"gemini-3","description":"Nano Banana Pro is Google’s most advanced image-generation and editing model, built on Gemini 3 
Pro.","context_window":65536,"max_output_tokens":32768,"modalities":{"input":["image","text"],"output":["image","text"]},"capabilities":{"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"tool_call":true,"batch":true,"vision":true},"pricing":{"input":2,"output":12,"cached_input":0.2},"model_type":"chat","release_date":"2025-11-20","tagline":"Nano Banana Pro is Google’s most advanced image-generation and editing model, built on Gemini 3 Pro.","knowledge_cutoff":"2025-01","license":"proprietary","open_weight":false},{"id":"google/gemini-3-pro-image","name":"Google: Nano Banana Pro (Gemini 3 Pro Image)","created_by":"google","source":"official","family":"gemini-3","description":"Nano Banana Pro is Google’s most advanced image-generation and editing model, built on Gemini 3 Pro.","release_date":"2026-06-18","context_window":65536,"max_output_tokens":32768,"model_type":"chat","tagline":"Nano Banana Pro is Google’s most advanced image-generation and editing model, built on Gemini 3 Pro.","capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"batch":true,"vision":true},"modalities":{"input":["image","text"],"output":["image","text"]},"pricing":{"input":2,"output":12,"cached_input":0.2},"tools":["function_calling"],"last_updated":"2026-06-18","knowledge_cutoff":"2025-01","license":"proprietary","open_weight":false},{"id":"google/gemini-3-pro-preview","name":"Google: Gemini 3 Pro Preview","created_by":"google","source":"official","last_updated":"2026-03-24","family":"gemini-3","description":"Gemini 3 Pro is Google’s flagship frontier model for high-precision multimodal reasoning, combining strong performance across text, image, video, audio, and code with a 1M-token context 
window.","status":"deprecated","deprecation_date":"2026-03-26","context_window":1048576,"max_output_tokens":65536,"modalities":{"input":["text","image","audio","video"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"batch":true,"vision":true},"pricing":{"input":2,"output":12,"cached_input":0.2},"model_type":"chat","release_date":"2025-11-18","tagline":"Gemini 3 Pro is Google’s flagship frontier model for high-precision multimodal reasoning, combining strong performance across text, image, video, audio, and code with a 1M-token context window.","tools":["function_calling"],"knowledge_cutoff":"2025-01","license":"proprietary","open_weight":false},{"id":"google/gemini-3.1-flash-image-preview","name":"Google: Nano Banana 2 (Gemini 3.1 Flash Image Preview)","created_by":"google","source":"official","last_updated":"2026-06-29","family":"gemini-3.1","description":"Gemini 3.1 Flash Image Preview, a.k.a.","context_window":131072,"max_output_tokens":32768,"modalities":{"input":["image","text"],"output":["image","text"]},"capabilities":{"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"tool_call":true,"batch":true,"vision":true},"pricing":{"input":0.5,"output":3},"model_type":"chat","release_date":"2026-02-26","tagline":"Gemini 3.1 Flash Image Preview, a.k.a.","knowledge_cutoff":"2025-01","license":"proprietary","open_weight":false},{"id":"google/gemini-3.1-flash-image","name":"Google: Nano Banana 2 (Gemini 3.1 Flash Image)","created_by":"google","source":"official","family":"gemini-3.1","description":"Gemini 3.1 Flash Image, a.k.a.","release_date":"2026-06-18","context_window":131072,"max_output_tokens":32768,"model_type":"chat","tagline":"Gemini 3.1 Flash Image, 
a.k.a.","capabilities":{"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"tool_call":true,"batch":true,"vision":true},"modalities":{"input":["image","text"],"output":["image","text"]},"pricing":{"input":0.5,"output":3},"last_updated":"2026-06-29","knowledge_cutoff":"2025-01","license":"proprietary","open_weight":false},{"id":"google/gemini-3.1-flash-lite-preview","name":"Google: Gemini 3.1 Flash Lite Preview","created_by":"google","source":"official","last_updated":"2026-03-24","family":"gemini-3.1","description":"Gemini 3.1 Flash Lite Preview is Google's high-efficiency model optimized for high-volume use cases.","context_window":1048576,"max_output_tokens":65536,"modalities":{"input":["text","image","video","audio"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"batch":true,"vision":true},"pricing":{"input":0.25,"output":1.5,"cached_input":0.025},"model_type":"chat","release_date":"2026-03-03","tagline":"Gemini 3.1 Flash Lite Preview is Google's high-efficiency model optimized for high-volume use cases.","tools":["function_calling"],"knowledge_cutoff":"2025-01","license":"proprietary","open_weight":false},{"id":"google/gemini-3.1-flash-lite","name":"Google: Gemini 3.1 Flash Lite","created_by":"google","source":"official","family":"gemini-3.1","description":"Gemini 3.1 Flash Lite is Google’s GA high-efficiency multimodal model optimized for low-latency, high-volume workloads.","release_date":"2026-05-07","context_window":1048576,"max_output_tokens":65536,"model_type":"chat","tagline":"Gemini 3.1 Flash Lite is Google’s GA high-efficiency multimodal model optimized for low-latency, high-volume 
workloads.","capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"batch":true,"vision":true},"modalities":{"input":["text","image","video","audio"],"output":["text"]},"pricing":{"input":0.25,"output":1.5,"cached_input":0.025},"tools":["function_calling"],"last_updated":"2026-05-10","knowledge_cutoff":"2025-01","license":"proprietary","open_weight":false},{"id":"google/gemini-3.1-pro-preview-customtools","name":"Google: Gemini 3.1 Pro Preview Custom Tools","created_by":"google","source":"official","last_updated":"2026-05-17","family":"gemini-3.1","description":"Gemini 3.1 Pro Preview Custom Tools is a variant of Gemini 3.1 Pro that improves tool selection behavior by preventing overuse of a general bash tool when more efficient third-party...","context_window":1048756,"max_output_tokens":65536,"modalities":{"input":["text","audio","image","video"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":2,"output":12,"cached_input":0.2},"model_type":"chat","release_date":"2026-02-25","tagline":"Gemini 3.1 Pro Preview Custom Tools is a variant of Gemini 3.1 Pro that improves tool selection behavior by preventing overuse of a general bash tool when more efficient third-party or user-defined fu","tools":["function_calling"]},{"id":"google/gemini-3.1-pro-preview","name":"Google: Gemini 3.1 Pro Preview","created_by":"google","source":"official","last_updated":"2026-03-24","family":"gemini-3.1","description":"Gemini 3.1 Pro Preview is Google’s frontier reasoning model, delivering enhanced software engineering performance, improved agentic reliability, and more efficient token usage across complex 
workflows.","context_window":1048576,"max_output_tokens":65536,"modalities":{"input":["audio","image","text","video"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"batch":true,"vision":true},"pricing":{"input":2,"output":12,"cached_input":0.2},"model_type":"chat","release_date":"2026-02-19","tagline":"Gemini 3.1 Pro Preview is Google’s frontier reasoning model, delivering enhanced software engineering performance, improved agentic reliability, and more efficient token usage across complex workflows","tools":["function_calling"],"knowledge_cutoff":"2025-01","license":"proprietary","open_weight":false},{"id":"google/gemini-3.5-flash","name":"Google: Gemini 3.5 Flash","created_by":"google","source":"official","family":"gemini-3.5","description":"Gemini 3.5 Flash is Google's high-efficiency multimodal model, bringing near-Pro level coding and reasoning at Flash-tier cost and speed.","release_date":"2026-05-19","context_window":1048576,"max_output_tokens":65536,"model_type":"chat","tagline":"Gemini 3.5 Flash is Google's high-efficiency multimodal model, bringing near-Pro level coding and reasoning at Flash-tier cost and speed.","capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"batch":true,"vision":true},"modalities":{"input":["text","image","video","audio"],"output":["text"]},"pricing":{"input":1.5,"output":9,"cached_input":0.15},"tools":["function_calling"],"last_updated":"2026-05-23","knowledge_cutoff":"2025-01","license":"proprietary","open_weight":false},{"id":"google/gemma-2-27b-it","name":"Google: Gemma 2 27B","created_by":"google","source":"official","last_updated":"2026-03-24","family":"gemma-2","description":"Gemma 2 27B by Google is an open model built from the same research and technology used to create the [Gemini 
models](/models?q=gemini).","context_window":8192,"max_output_tokens":2048,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"structured_output":true,"json_mode":true},"pricing":{"input":0.65,"output":0.65},"model_type":"chat","parameters":27,"release_date":"2024-07-13","tagline":"Gemma 2 27B by Google is an open model built from the same research and technology used to create the [Gemini models](/models?q=gemini)."},{"id":"google/gemma-2-9b-it","name":"Google: Gemma 2 9B","created_by":"google","source":"official","last_updated":"2026-03-23","family":"gemma-2","description":"Gemma 2 9B by Google is an advanced, open-source language model that sets a new standard for efficiency and performance in its size class.","context_window":8192,"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.03,"output":0.09},"model_type":"chat","parameters":9,"release_date":"2024-06-28","tagline":"Gemma 2 9B by Google is an advanced, open-source language model that sets a new standard for efficiency and performance in its size class."},{"id":"google/gemma-3-12b-it:free","name":"Google: Gemma 3 12B (free)","created_by":"google","source":"official","last_updated":"2026-03-23","family":"gemma-3","description":"Gemma 3 introduces multimodality, supporting vision-language input and text outputs.","context_window":32768,"max_output_tokens":8192,"modalities":{"input":["text","image"],"output":["text"]},"model_type":"chat","parameters":12,"release_date":"2025-03-13","tagline":"Gemma 3 introduces multimodality, supporting vision-language input and text outputs."},{"id":"google/gemma-3-12b-it","name":"Google: Gemma 3 12B","created_by":"google","source":"official","last_updated":"2026-06-10","family":"gemma-3","description":"Gemma 3 introduces multimodality, supporting vision-language input and text 
outputs.","context_window":131072,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"structured_output":true,"json_mode":true,"tool_call":true},"pricing":{"input":0.05,"output":0.15},"model_type":"chat","parameters":12,"release_date":"2025-03-13","tagline":"Gemma 3 introduces multimodality, supporting vision-language input and text outputs.","max_output_tokens":16384,"tools":["function_calling"]},{"id":"google/gemma-3-27b-it:free","name":"Google: Gemma 3 27B (free)","created_by":"google","source":"official","last_updated":"2026-03-24","family":"gemma-3","description":"Gemma 3 introduces multimodality, supporting vision-language input and text outputs.","context_window":131072,"max_output_tokens":8192,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"structured_output":true,"json_mode":true},"model_type":"chat","parameters":27,"release_date":"2025-03-12","tagline":"Gemma 3 introduces multimodality, supporting vision-language input and text outputs."},{"id":"google/gemma-3-27b-it","name":"Google: Gemma 3 27B","created_by":"google","source":"official","last_updated":"2026-04-25","family":"gemma-3","description":"Gemma 3 introduces multimodality, supporting vision-language input and text outputs.","context_window":131072,"max_output_tokens":16384,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"structured_output":true,"json_mode":true,"tool_call":true},"pricing":{"input":0.08,"output":0.16},"model_type":"chat","parameters":27,"release_date":"2025-03-12","tagline":"Gemma 3 introduces multimodality, supporting vision-language input and text outputs.","tools":["function_calling"]},{"id":"google/gemma-3-4b-it:free","name":"Google: Gemma 3 4B (free)","created_by":"google","source":"official","last_updated":"2026-03-24","family":"gemma-3","description":"Gemma 3 introduces multimodality, supporting vision-language input and text 
outputs.","context_window":32768,"max_output_tokens":8192,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"structured_output":true,"json_mode":true},"model_type":"chat","parameters":4,"release_date":"2025-03-13","tagline":"Gemma 3 introduces multimodality, supporting vision-language input and text outputs."},{"id":"google/gemma-3-4b-it","name":"Google: Gemma 3 4B","created_by":"google","source":"official","last_updated":"2026-06-10","family":"gemma-3","description":"Gemma 3 introduces multimodality, supporting vision-language input and text outputs.","context_window":131072,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"structured_output":true,"json_mode":true},"pricing":{"input":0.05,"output":0.1},"model_type":"chat","parameters":4,"release_date":"2025-03-13","tagline":"Gemma 3 introduces multimodality, supporting vision-language input and text outputs.","max_output_tokens":16384},{"id":"google/gemma-3n-e2b-it:free","name":"Google: Gemma 3n 2B (free)","created_by":"google","source":"official","last_updated":"2026-03-24","family":"gemma-3n","description":"Gemma 3n E2B IT is a multimodal, instruction-tuned model developed by Google DeepMind, designed to operate efficiently at an effective parameter size of 2B while leveraging a 6B architecture.","context_window":8192,"max_output_tokens":2048,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"structured_output":true,"json_mode":true},"model_type":"chat","release_date":"2025-07-09","tagline":"Gemma 3n E2B IT is a multimodal, instruction-tuned model developed by Google DeepMind, designed to operate efficiently at an effective parameter size of 2B while leveraging a 6B architecture."},{"id":"google/gemma-3n-e4b-it:free","name":"Google: Gemma 3n 4B (free)","created_by":"google","source":"official","last_updated":"2026-03-24","family":"gemma-3n","description":"Gemma 3n E4B-it is optimized for efficient execution on mobile and low-resource devices, such 
as phones, laptops, and tablets.","context_window":8192,"max_output_tokens":2048,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"structured_output":true,"json_mode":true},"model_type":"chat","release_date":"2025-05-20","tagline":"Gemma 3n E4B-it is optimized for efficient execution on mobile and low-resource devices, such as phones, laptops, and tablets."},{"id":"google/gemma-3n-e4b-it","name":"Google: Gemma 3n 4B","created_by":"google","source":"official","last_updated":"2026-06-18","family":"gemma-3n","description":"Gemma 3n E4B-it is optimized for efficient execution on mobile and low-resource devices, such as phones, laptops, and tablets.","context_window":32768,"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.06,"output":0.12},"model_type":"chat","release_date":"2025-05-20","tagline":"Gemma 3n E4B-it is optimized for efficient execution on mobile and low-resource devices, such as phones, laptops, and tablets.","capabilities":{"structured_output":true,"json_mode":true}},{"id":"google/gemma-4-26b-a4b-it:free","name":"Google: Gemma 4 26B A4B (free)","created_by":"google","source":"official","family":"gemma-4","description":"Gemma 4 26B A4B IT is an instruction-tuned Mixture-of-Experts (MoE) model from Google DeepMind.","release_date":"2026-04-03","context_window":262144,"max_output_tokens":32768,"parameters":26,"active_parameters":4,"model_type":"chat","tagline":"Gemma 4 26B A4B IT is an instruction-tuned Mixture-of-Experts (MoE) model from Google DeepMind.","capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"modalities":{"input":["image","text","video"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-04-08"},{"id":"google/gemma-4-26b-a4b-it","name":"Google: Gemma 4 26B A4B ","created_by":"google","source":"official","family":"gemma-4","description":"Gemma 4 26B A4B IT is an instruction-tuned Mixture-of-Experts (MoE) model from Google 
DeepMind.","release_date":"2026-04-03","context_window":262144,"max_output_tokens":16384,"parameters":26,"active_parameters":4,"model_type":"chat","tagline":"Gemma 4 26B A4B IT is an instruction-tuned Mixture-of-Experts (MoE) model from Google DeepMind.","capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"modalities":{"input":["image","text","video"],"output":["text"]},"pricing":{"input":0.06,"output":0.33,"cached_input":0.04},"tools":["function_calling"],"last_updated":"2026-05-23"},{"id":"google/gemma-4-31b-it:free","name":"Google: Gemma 4 31B (free)","created_by":"google","source":"official","family":"gemma-4","description":"Gemma 4 31B Instruct is Google DeepMind's 30.7B dense multimodal model supporting text and image input with text output.","release_date":"2026-04-02","context_window":262144,"max_output_tokens":8192,"parameters":31,"model_type":"chat","tagline":"Gemma 4 31B Instruct is Google DeepMind's 30.7B dense multimodal model supporting text and image input with text output.","capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"modalities":{"input":["image","text","video"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-06-18"},{"id":"google/gemma-4-31b-it","name":"Google: Gemma 4 31B","created_by":"google","source":"official","family":"gemma-4","description":"Gemma 4 31B Instruct is Google DeepMind's 30.7B dense multimodal model supporting text and image input with text output.","release_date":"2026-04-02","context_window":262144,"max_output_tokens":262144,"parameters":31,"model_type":"chat","tagline":"Gemma 4 31B Instruct is Google DeepMind's 30.7B dense multimodal model supporting text and image input with text 
output.","capabilities":{"structured_output":true,"reasoning":true,"json_mode":true,"tool_call":true},"modalities":{"input":["image","text","video"],"output":["text"]},"pricing":{"input":0.12,"output":0.35,"cached_input":0.09},"last_updated":"2026-06-18","tools":["function_calling"]},{"id":"google/lyria-3-clip-preview","name":"Google: Lyria 3 Clip Preview","created_by":"google","source":"official","description":"30 second duration clips are priced at $0.04 per clip.","release_date":"2026-03-30","context_window":1048576,"max_output_tokens":65536,"model_type":"tts","tagline":"30 second duration clips are priced at $0.04 per clip.","capabilities":{"structured_output":true,"json_mode":true,"streaming":true,"tool_call":true,"reasoning":true,"batch":true,"vision":true},"modalities":{"input":["text","image"],"output":["text","audio"]},"last_updated":"2026-04-01","license":"proprietary","open_weight":false},{"id":"google/lyria-3-pro-preview","name":"Google: Lyria 3 Pro Preview","created_by":"google","source":"official","description":"Full-length songs are priced at $0.08 per song.","release_date":"2026-03-30","context_window":1048576,"max_output_tokens":65536,"model_type":"tts","tagline":"Full-length songs are priced at $0.08 per song.","capabilities":{"structured_output":true,"json_mode":true,"streaming":true,"tool_call":true,"reasoning":true,"batch":true,"vision":true},"modalities":{"input":["text","image"],"output":["text","audio"]},"last_updated":"2026-04-01","license":"proprietary","open_weight":false},{"id":"gryphe/mythomax-l2-13b","name":"MythoMax 13B","created_by":"gryphe","source":"official","last_updated":"2026-03-24","description":"One of the highest performing and most popular fine-tunes of Llama 2 13B, with rich descriptions and 
roleplay.","context_window":4096,"max_output_tokens":4096,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"structured_output":true,"json_mode":true},"pricing":{"input":0.06,"output":0.06},"parameters":13,"release_date":"2023-07-02","tagline":"One of the highest performing and most popular fine-tunes of Llama 2 13B, with rich descriptions and roleplay."},{"id":"ibm-granite/granite-4.0-h-micro","name":"IBM: Granite 4.0 Micro","created_by":"ibm-granite","source":"official","last_updated":"2026-06-18","description":"Granite-4.0-H-Micro is a 3B parameter from the Granite 4 family of models.","context_window":131000,"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.017,"output":0.112},"release_date":"2025-10-20","tagline":"Granite-4.0-H-Micro is a 3B parameter from the Granite 4 family of models.","model_type":"chat","max_output_tokens":131000,"capabilities":{"structured_output":true,"json_mode":true}},{"id":"ibm-granite/granite-4.1-8b","name":"IBM: Granite 4.1 8B","created_by":"ibm-granite","source":"official","description":"Granite 4.1 8B is a dense, decoder-only 8-billion-parameter language model from IBM, part of the Granite 4.1 family.","release_date":"2026-04-30","context_window":131072,"max_output_tokens":131072,"parameters":8,"model_type":"chat","tagline":"Granite 4.1 8B is a dense, decoder-only 8-billion-parameter language model from IBM, part of the Granite 4.1 family.","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.05,"output":0.1,"cached_input":0.05},"tools":["function_calling"],"last_updated":"2026-05-01"},{"id":"inception/mercury-2","name":"Inception: Mercury 2","created_by":"inception","source":"official","last_updated":"2026-03-24","description":"Mercury 2 is an extremely fast reasoning LLM, and the first reasoning diffusion LLM 
(dLLM).","context_window":128000,"max_output_tokens":50000,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true},"pricing":{"input":0.25,"output":0.75,"cached_input":0.025},"release_date":"2026-03-04","tagline":"Mercury 2 is an extremely fast reasoning LLM, and the first reasoning diffusion LLM (dLLM).","tools":["function_calling"],"license":"proprietary","open_weight":false},{"id":"inception/mercury-coder","name":"Inception: Mercury Coder","created_by":"inception","source":"official","last_updated":"2026-04-03","description":"Mercury Coder is the first diffusion large language model (dLLM).","context_window":128000,"max_output_tokens":32000,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true},"pricing":{"input":0.25,"output":0.75,"cached_input":0.025},"release_date":"2025-04-30","tagline":"Mercury Coder is the first diffusion large language model (dLLM).","tools":["function_calling"],"status":"deprecated","deprecation_date":"2026-04-15","license":"proprietary","open_weight":false},{"id":"inception/mercury","name":"Inception: Mercury","created_by":"inception","source":"official","last_updated":"2026-03-24","description":"Mercury is the first diffusion large language model (dLLM).","status":"deprecated","deprecation_date":"2026-04-15","context_window":128000,"max_output_tokens":32000,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true},"pricing":{"input":0.25,"output":0.75,"cached_input":0.025},"release_date":"2025-06-26","tagline":"Mercury is the first diffusion large language model (dLLM).","tools":["function_calling"],"license":"proprietary","open_weight":false},{"id":"inclusionai/ling-2.6-1t:free","name":"inclusionAI: Ling-2.6-1T 
(free)","created_by":"inclusionai","source":"official","description":"Ling-2.6-1T is an instant (instruct) model from inclusionAI and the company’s trillion-parameter flagship, designed for real-world agents that require fast execution and high efficiency at scale.","status":"deprecated","release_date":"2026-04-23","deprecation_date":"2026-05-07","context_window":262144,"max_output_tokens":32768,"tagline":"Ling-2.6-1T is an instant (instruct) model from inclusionAI and the company’s trillion-parameter flagship, designed for real-world agents that require fast execution and high efficiency at scale.","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true},"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-05-01"},{"id":"inclusionai/ling-2.6-1t","name":"inclusionAI: Ling-2.6-1T","created_by":"inclusionai","source":"official","description":"Ling-2.6-1T is an instant (instruct) model from inclusionAI and the company’s trillion-parameter flagship, designed for real-world agents that require fast execution and high efficiency at scale.","release_date":"2026-04-23","context_window":262144,"max_output_tokens":32768,"tagline":"Ling-2.6-1T is an instant (instruct) model from inclusionAI and the company’s trillion-parameter flagship, designed for real-world agents that require fast execution and high efficiency at scale.","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.075,"output":0.625,"cached_input":0.015},"tools":["function_calling"],"last_updated":"2026-05-23"},{"id":"inclusionai/ling-2.6-flash:free","name":"inclusionAI: Ling-2.6-flash (free)","created_by":"inclusionai","source":"official","description":"Ling-2.6-flash is an instant (instruct) model from inclusionAI with 104B total parameters and 7.4B active parameters, designed for real-world agents that require fast responses, strong execution, and 
","release_date":"2026-04-21","context_window":262144,"max_output_tokens":32768,"tagline":"Ling-2.6-flash is an instant (instruct) model from inclusionAI with 104B total parameters and 7.4B active parameters, designed for real-world agents that require fast responses, strong execution, and ","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true},"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-04-24","status":"deprecated","deprecation_date":"2026-04-29"},{"id":"inclusionai/ling-2.6-flash","name":"inclusionAI: Ling-2.6-flash","created_by":"inclusionai","source":"official","description":"Ling-2.6-flash is an instant (instruct) model from inclusionAI with 104B total parameters and 7.4B active parameters, designed for real-world agents that require fast responses, strong execution, and ","release_date":"2026-04-21","context_window":262144,"max_output_tokens":32768,"tagline":"Ling-2.6-flash is an instant (instruct) model from inclusionAI with 104B total parameters and 7.4B active parameters, designed for real-world agents that require fast responses, strong execution, and ","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.01,"output":0.03,"cached_input":0.002},"tools":["function_calling"],"last_updated":"2026-05-17"},{"id":"inclusionai/ring-2.6-1t:free","name":"inclusionAI: Ring-2.6-1T (free)","created_by":"inclusionai","source":"official","description":"Ring-2.6-1T is a 1T-parameter-scale thinking model with 63B active parameters, built for real-world agent workflows that require both strong capability and operational efficiency.","release_date":"2026-05-08","context_window":262144,"max_output_tokens":65536,"tagline":"Ring-2.6-1T is a 1T-parameter-scale thinking model with 63B active parameters, built for real-world agent workflows that require both strong capability and operational 
efficiency.","capabilities":{"tool_call":true,"reasoning":true},"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-05-10"},{"id":"inclusionai/ring-2.6-1t","name":"inclusionAI: Ring-2.6-1T","created_by":"inclusionai","source":"official","description":"Ring-2.6-1T is a 1T-parameter-scale thinking model with 63B active parameters, built for real-world agent workflows that require both strong capability and operational efficiency.","release_date":"2026-05-08","context_window":262144,"max_output_tokens":65536,"tagline":"Ring-2.6-1T is a 1T-parameter-scale thinking model with 63B active parameters, built for real-world agent workflows that require both strong capability and operational efficiency.","capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.075,"output":0.625,"cached_input":0.015},"tools":["function_calling"],"last_updated":"2026-06-03"},{"id":"inflection/inflection-3-pi","name":"Inflection: Inflection 3 Pi","created_by":"inflection","source":"official","last_updated":"2026-03-23","description":"Inflection 3 Pi powers Inflection's [Pi](https://pi.ai) chatbot, including backstory, emotional intelligence, productivity, and safety.","context_window":8000,"max_output_tokens":1024,"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":2.5,"output":10},"release_date":"2024-10-11","tagline":"Inflection 3 Pi powers Inflection's [Pi](https://pi.ai) chatbot, including backstory, emotional intelligence, productivity, and safety."},{"id":"inflection/inflection-3-productivity","name":"Inflection: Inflection 3 Productivity","created_by":"inflection","source":"official","last_updated":"2026-03-23","description":"Inflection 3 Productivity is optimized for following 
instructions.","context_window":8000,"max_output_tokens":1024,"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":2.5,"output":10},"release_date":"2024-10-11","tagline":"Inflection 3 Productivity is optimized for following instructions."},{"id":"kwaipilot/kat-coder-pro-v2","name":"Kwaipilot: KAT-Coder-Pro V2","created_by":"kwaipilot","source":"official","description":"KAT-Coder-Pro V2 is the latest high-performance model in KwaiKAT’s KAT-Coder series, designed for complex enterprise-grade software engineering and SaaS integration.","release_date":"2026-03-27","context_window":256000,"max_output_tokens":80000,"tagline":"KAT-Coder-Pro V2 is the latest high-performance model in KwaiKAT’s KAT-Coder series, designed for complex enterprise-grade software engineering and SaaS integration.","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.3,"output":1.2,"cached_input":0.06},"tools":["function_calling"],"last_updated":"2026-04-01"},{"id":"kwaipilot/kat-coder-pro","name":"Kwaipilot: KAT-Coder-Pro V1","created_by":"kwaipilot","source":"official","last_updated":"2026-03-24","description":"KAT-Coder-Pro V1 is KwaiKAT's most advanced agentic coding model in the KAT-Coder series.","context_window":256000,"max_output_tokens":128000,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true},"pricing":{"input":0.207,"output":0.828,"cached_input":0.041},"release_date":"2025-11-10","tagline":"KAT-Coder-Pro V1 is KwaiKAT's most advanced agentic coding model in the KAT-Coder series.","tools":["function_calling"]},{"id":"liquid/lfm-2-24b-a2b","name":"LiquidAI: LFM2-24B-A2B","created_by":"liquid","source":"official","last_updated":"2026-06-18","description":"LFM2-24B-A2B is the largest model in the LFM2 family of hybrid architectures designed for efficient on-device 
deployment.","context_window":128000,"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.03,"output":0.12},"parameters":24,"active_parameters":2,"release_date":"2026-02-25","tagline":"LFM2-24B-A2B is the largest model in the LFM2 family of hybrid architectures designed for efficient on-device deployment.","model_type":"chat","capabilities":{"structured_output":true,"json_mode":true}},{"id":"liquid/lfm-2.2-6b","name":"LiquidAI: LFM2-2.6B","created_by":"liquid","source":"official","last_updated":"2026-03-23","description":"LFM2 is a new generation of hybrid models developed by Liquid AI, specifically designed for edge AI and on-device deployment.","context_window":32768,"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.01,"output":0.02},"parameters":6,"release_date":"2025-10-20","tagline":"LFM2 is a new generation of hybrid models developed by Liquid AI, specifically designed for edge AI and on-device deployment.","model_type":"chat"},{"id":"liquid/lfm-2.5-1.2b-instruct:free","name":"LiquidAI: LFM2.5-1.2B-Instruct (free)","created_by":"liquid","source":"official","last_updated":"2026-06-18","description":"LFM2.5-1.2B-Instruct is a compact, high-performance instruction-tuned model built for fast on-device AI.","context_window":32768,"modalities":{"input":["text"],"output":["text"]},"parameters":1.2,"release_date":"2026-01-20","tagline":"LFM2.5-1.2B-Instruct is a compact, high-performance instruction-tuned model built for fast on-device AI.","model_type":"chat","capabilities":{"structured_output":true,"json_mode":true}},{"id":"liquid/lfm-2.5-1.2b-thinking:free","name":"LiquidAI: LFM2.5-1.2B-Thinking (free)","created_by":"liquid","source":"official","last_updated":"2026-06-18","description":"LFM2.5-1.2B-Thinking is a lightweight reasoning-focused model optimized for agentic tasks, data extraction, and RAG—while still running comfortably on edge 
devices.","context_window":32768,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"reasoning":true,"tool_call":true,"structured_output":true,"json_mode":true},"parameters":1.2,"release_date":"2026-01-20","tagline":"LFM2.5-1.2B-Thinking is a lightweight reasoning-focused model optimized for agentic tasks, data extraction, and RAG—while still running comfortably on edge devices.","model_type":"chat","tools":["function_calling"]},{"id":"liquid/lfm2-8b-a1b","name":"LiquidAI: LFM2-8B-A1B","created_by":"liquid","source":"official","last_updated":"2026-03-23","description":"LFM2-8B-A1B is an efficient on-device Mixture-of-Experts (MoE) model from Liquid AI’s LFM2 family, built for fast, high-quality inference on edge hardware.","context_window":32768,"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.01,"output":0.02},"parameters":8,"active_parameters":1,"release_date":"2025-10-20","tagline":"LFM2-8B-A1B is an efficient on-device Mixture-of-Experts (MoE) model from Liquid AI’s LFM2 family, built for fast, high-quality inference on edge hardware.","model_type":"chat"},{"id":"mancer/weaver","name":"Mancer: Weaver (alpha)","created_by":"mancer","source":"official","last_updated":"2026-03-24","description":"An attempt to recreate Claude-style verbosity, but don't expect the same level of coherence or memory.","context_window":8000,"max_output_tokens":2000,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"structured_output":true,"json_mode":true},"pricing":{"input":0.75,"output":1},"release_date":"2023-08-02","tagline":"An attempt to recreate Claude-style verbosity, but don't expect the same level of coherence or memory."},{"id":"meituan/longcat-flash-chat","name":"Meituan: LongCat Flash Chat","created_by":"meituan","source":"official","last_updated":"2026-03-24","description":"LongCat-Flash-Chat is a large-scale Mixture-of-Experts (MoE) model with 560B total parameters, of which 18.6B–31.3B (≈27B on average) are 
dynamically activated per input.","context_window":131072,"max_output_tokens":131072,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true},"pricing":{"input":0.2,"output":0.8,"cached_input":0.2},"release_date":"2025-09-09","tagline":"LongCat-Flash-Chat is a large-scale Mixture-of-Experts (MoE) model with 560B total parameters, of which 18.6B–31.3B (≈27B on average) are dynamically activated per input.","tools":["function_calling"]},{"id":"meta-llama/llama-3-70b-instruct","name":"Meta: Llama 3 70B Instruct","created_by":"meta-llama","source":"official","last_updated":"2026-06-10","family":"llama-3","description":"Meta's latest class of model (Llama 3) launched with a variety of sizes & flavors.","context_window":8192,"max_output_tokens":8000,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"structured_output":true,"json_mode":true},"pricing":{"input":0.51,"output":0.74},"model_type":"chat","parameters":70,"release_date":"2024-04-18","tagline":"Meta's latest class of model (Llama 3) launched with a variety of sizes & flavors.","status":"deprecated","deprecation_date":"2026-06-19"},{"id":"meta-llama/llama-3-8b-instruct","name":"Meta: Llama 3 8B Instruct","created_by":"meta-llama","source":"official","last_updated":"2026-06-10","family":"llama-3","description":"Meta's latest class of model (Llama 3) launched with a variety of sizes & flavors.","context_window":8192,"max_output_tokens":8192,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true},"pricing":{"input":0.14,"output":0.14},"model_type":"chat","parameters":8,"release_date":"2024-04-18","tagline":"Meta's latest class of model (Llama 3) launched with a variety of sizes & flavors.","tools":["function_calling"],"status":"deprecated","deprecation_date":"2026-05-07"},{"id":"meta-llama/llama-3.1-405b","name":"Meta: Llama 3.1 405B 
(base)","created_by":"meta-llama","source":"official","last_updated":"2026-03-23","family":"llama-3.1","description":"Meta's latest class of model (Llama 3.1) launched with a variety of sizes & flavors.","context_window":32768,"max_output_tokens":32768,"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":4,"output":4},"model_type":"chat","parameters":405,"release_date":"2024-08-02","tagline":"Meta's latest class of model (Llama 3.1) launched with a variety of sizes & flavors."},{"id":"meta-llama/llama-3.1-70b-instruct","name":"Meta: Llama 3.1 70B Instruct","created_by":"meta-llama","source":"official","last_updated":"2026-04-25","family":"llama-3.1","description":"Meta's latest class of model (Llama 3.1) launched with a variety of sizes & flavors.","context_window":131072,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true},"pricing":{"input":0.4,"output":0.4},"model_type":"chat","parameters":70,"release_date":"2024-07-23","tagline":"Meta's latest class of model (Llama 3.1) launched with a variety of sizes & flavors.","tools":["function_calling"],"max_output_tokens":16384},{"id":"meta-llama/llama-3.1-8b-instruct","name":"Meta: Llama 3.1 8B Instruct","created_by":"meta-llama","source":"official","last_updated":"2026-06-10","family":"llama-3.1","description":"Meta's latest class of model (Llama 3.1) launched with a variety of sizes & flavors.","context_window":131072,"max_output_tokens":16384,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true},"pricing":{"input":0.02,"output":0.03},"model_type":"chat","parameters":8,"release_date":"2024-07-23","tagline":"Meta's latest class of model (Llama 3.1) launched with a variety of sizes & flavors.","tools":["function_calling"]},{"id":"meta-llama/llama-3.2-11b-vision-instruct","name":"Meta: Llama 3.2 11B Vision 
Instruct","created_by":"meta-llama","source":"official","last_updated":"2026-06-10","family":"llama-3.2","description":"Llama 3.2 11B Vision is a multimodal model with 11 billion parameters, designed to handle tasks combining visual and textual data.","context_window":131072,"max_output_tokens":16384,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"structured_output":true,"json_mode":true},"pricing":{"input":0.345,"output":0.345},"model_type":"chat","parameters":11,"release_date":"2024-09-25","tagline":"Llama 3.2 11B Vision is a multimodal model with 11 billion parameters, designed to handle tasks combining visual and textual data."},{"id":"meta-llama/llama-3.2-1b-instruct","name":"Meta: Llama 3.2 1B Instruct","created_by":"meta-llama","source":"official","last_updated":"2026-05-23","family":"llama-3.2","description":"Llama 3.2 1B is a 1-billion-parameter language model focused on efficiently performing natural language tasks, such as summarization, dialogue, and multilingual text analysis.","context_window":131072,"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.027,"output":0.201},"model_type":"chat","parameters":1,"release_date":"2024-09-25","tagline":"Llama 3.2 1B is a 1-billion-parameter language model focused on efficiently performing natural language tasks, such as summarization, dialogue, and multilingual text analysis.","max_output_tokens":60000},{"id":"meta-llama/llama-3.2-3b-instruct:free","name":"Meta: Llama 3.2 3B Instruct (free)","created_by":"meta-llama","source":"official","last_updated":"2026-03-23","family":"llama-3.2","description":"Llama 3.2 3B is a 3-billion-parameter multilingual large language model, optimized for advanced natural language processing tasks like dialogue generation, reasoning, and summarization.","context_window":131072,"modalities":{"input":["text"],"output":["text"]},"model_type":"chat","parameters":3,"release_date":"2024-09-25","tagline":"Llama 3.2 3B is a 3-billion-parameter 
multilingual large language model, optimized for advanced natural language processing tasks like dialogue generation, reasoning, and summarization."},{"id":"meta-llama/llama-3.2-3b-instruct","name":"Meta: Llama 3.2 3B Instruct","created_by":"meta-llama","source":"official","last_updated":"2026-05-23","family":"llama-3.2","description":"Llama 3.2 3B is a 3-billion-parameter multilingual large language model, optimized for advanced natural language processing tasks like dialogue generation, reasoning, and summarization.","context_window":131072,"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.051,"output":0.335},"model_type":"chat","parameters":3,"release_date":"2024-09-25","tagline":"Llama 3.2 3B is a 3-billion-parameter multilingual large language model, optimized for advanced natural language processing tasks like dialogue generation, reasoning, and summarization.","max_output_tokens":80000},{"id":"meta-llama/llama-3.3-70b-instruct:free","name":"Meta: Llama 3.3 70B Instruct (free)","created_by":"meta-llama","source":"official","last_updated":"2026-05-17","family":"llama-3.3","description":"The Meta Llama 3.3 multilingual large language model (LLM) is a pretrained and instruction tuned generative model in 70B (text in/text out).","context_window":131072,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true},"model_type":"chat","parameters":70,"release_date":"2024-12-06","tagline":"The Meta Llama 3.3 multilingual large language model (LLM) is a pretrained and instruction tuned generative model in 70B (text in/text out).","tools":["function_calling"]},{"id":"meta-llama/llama-3.3-70b-instruct","name":"Meta: Llama 3.3 70B Instruct","created_by":"meta-llama","source":"official","last_updated":"2026-04-22","family":"llama-3.3","description":"The Meta Llama 3.3 multilingual large language model (LLM) is a pretrained and instruction tuned generative model in 70B (text in/text 
out).","context_window":131072,"max_output_tokens":16384,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true},"pricing":{"input":0.1,"output":0.32},"model_type":"chat","parameters":70,"release_date":"2024-12-06","tagline":"The Meta Llama 3.3 multilingual large language model (LLM) is a pretrained and instruction tuned generative model in 70B (text in/text out).","tools":["function_calling"]},{"id":"meta-llama/llama-4-maverick","name":"Meta: Llama 4 Maverick","created_by":"meta-llama","source":"official","last_updated":"2026-04-07","family":"llama-4","description":"Llama 4 Maverick 17B Instruct (128E) is a high-capacity multimodal language model from Meta, built on a mixture-of-experts (MoE) architecture with 128 experts and 17 billion active parameters per forw","context_window":1048576,"max_output_tokens":16384,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true},"pricing":{"input":0.15,"output":0.6},"model_type":"chat","release_date":"2025-04-05","tagline":"Llama 4 Maverick 17B Instruct (128E) is a high-capacity multimodal language model from Meta, built on a mixture-of-experts (MoE) architecture with 128 experts and 17 billion active parameters per forw","tools":["function_calling"]},{"id":"meta-llama/llama-4-scout","name":"Meta: Llama 4 Scout","created_by":"meta-llama","source":"official","last_updated":"2026-06-10","family":"llama-4","description":"Llama 4 Scout 17B Instruct (16E) is a mixture-of-experts (MoE) language model developed by Meta, activating 17 billion parameters out of a total of 109B.","context_window":10000000,"max_output_tokens":16384,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true},"pricing":{"input":0.1,"output":0.3},"model_type":"chat","release_date":"2025-04-05","tagline":"Llama 4 Scout 17B Instruct (16E) 
is a mixture-of-experts (MoE) language model developed by Meta, activating 17 billion parameters out of a total of 109B.","tools":["function_calling"]},{"id":"meta-llama/llama-guard-3-8b","name":"Llama Guard 3 8B","created_by":"meta-llama","source":"official","last_updated":"2026-05-23","family":"llama-guard","description":"Llama Guard 3 is a Llama-3.1-8B pretrained model, fine-tuned for content safety classification.","context_window":131072,"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.484,"output":0.03},"model_type":"moderation","parameters":8,"release_date":"2025-02-12","tagline":"Llama Guard 3 is a Llama-3.1-8B pretrained model, fine-tuned for content safety classification.","max_output_tokens":131072},{"id":"meta-llama/llama-guard-4-12b:free","name":"Meta: Llama Guard 4 12B (free)","created_by":"meta-llama","source":"official","family":"llama-guard","description":"Llama Guard 4 is a Llama 4 Scout-derived multimodal pretrained model, fine-tuned for content safety classification.","release_date":"2025-04-30","context_window":163840,"max_output_tokens":65000,"model_type":"chat","tagline":"Llama Guard 4 is a Llama 4 Scout-derived multimodal pretrained model, fine-tuned for content safety classification.","modalities":{"input":["image","text"],"output":["text"]},"last_updated":"2026-04-16"},{"id":"meta-llama/llama-guard-4-12b","name":"Meta: Llama Guard 4 12B","created_by":"meta-llama","source":"official","last_updated":"2026-04-25","family":"llama-guard","description":"Llama Guard 4 is a Llama 4 Scout-derived multimodal pretrained model, fine-tuned for content safety classification.","context_window":163840,"modalities":{"input":["image","text"],"output":["text"]},"capabilities":{"structured_output":true,"json_mode":true},"pricing":{"input":0.18,"output":0.18},"model_type":"moderation","parameters":12,"release_date":"2025-04-30","tagline":"Llama Guard 4 is a Llama 4 Scout-derived multimodal pretrained model, fine-tuned for content safety 
classification.","max_output_tokens":16384},{"id":"microsoft/phi-4-mini-instruct","name":"Microsoft: Phi 4 Mini Instruct","created_by":"microsoft","source":"official","description":"Phi-4-mini-instruct is a lightweight open model built upon synthetic data and filtered publicly available websites - with a focus on high-quality, reasoning dense data.","release_date":"2025-10-17","context_window":131072,"max_output_tokens":128000,"model_type":"chat","tagline":"Phi-4-mini-instruct is a lightweight open model built upon synthetic data and filtered publicly available websites - with a focus on high-quality, reasoning dense data.","capabilities":{"structured_output":true,"json_mode":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.08,"output":0.35,"cached_input":0.08},"last_updated":"2026-05-17"},{"id":"microsoft/phi-4","name":"Microsoft: Phi 4","created_by":"microsoft","source":"official","last_updated":"2026-06-29","description":"[Microsoft Research](/microsoft) Phi-4 is designed to perform well in complex reasoning tasks and can operate efficiently in situations with limited memory or where quick responses are needed.","context_window":16384,"max_output_tokens":16384,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"structured_output":true,"json_mode":true},"pricing":{"input":0.07,"output":0.14},"release_date":"2025-01-10","tagline":"[Microsoft Research](/microsoft) Phi-4 is designed to perform well in complex reasoning tasks and can operate efficiently in situations with limited memory or where quick responses are needed.","model_type":"chat"},{"id":"microsoft/wizardlm-2-8x22b","name":"WizardLM-2 8x22B","created_by":"microsoft","source":"official","last_updated":"2026-05-17","description":"WizardLM-2 8x22B is Microsoft AI's most advanced Wizard 
model.","context_window":65536,"max_output_tokens":8000,"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.62,"output":0.62},"release_date":"2024-04-16","tagline":"WizardLM-2 8x22B is Microsoft AI's most advanced Wizard model.","capabilities":{"structured_output":true,"json_mode":true}},{"id":"minimax/minimax-01","name":"MiniMax: MiniMax-01","created_by":"minimax","source":"official","last_updated":"2026-03-23","description":"MiniMax-01 is a combines MiniMax-Text-01 for text generation and MiniMax-VL-01 for image understanding.","context_window":1000192,"max_output_tokens":1000192,"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":0.2,"output":1.1},"model_type":"chat","family":"minimax","release_date":"2025-01-15","tagline":"MiniMax-01 is a combines MiniMax-Text-01 for text generation and MiniMax-VL-01 for image understanding."},{"id":"minimax/minimax-m1","name":"MiniMax: MiniMax M1","created_by":"minimax","source":"official","last_updated":"2026-03-23","description":"MiniMax-M1 is a large-scale, open-weight reasoning model designed for extended context and high-efficiency inference.","context_window":1000000,"max_output_tokens":40000,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"reasoning":true},"pricing":{"input":0.4,"output":2.2},"model_type":"chat","family":"minimax","release_date":"2025-06-17","tagline":"MiniMax-M1 is a large-scale, open-weight reasoning model designed for extended context and high-efficiency inference.","tools":["function_calling"]},{"id":"minimax/minimax-m2-her","name":"MiniMax: MiniMax M2-her","created_by":"minimax","source":"official","last_updated":"2026-03-23","description":"MiniMax M2-her is a dialogue-first large language model built for immersive roleplay, character-driven chat, and expressive multi-turn 
conversations.","context_window":65536,"max_output_tokens":2048,"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.3,"output":1.2,"cached_input":0.03},"model_type":"chat","family":"minimax","release_date":"2026-01-23","tagline":"MiniMax M2-her is a dialogue-first large language model built for immersive roleplay, character-driven chat, and expressive multi-turn conversations."},{"id":"minimax/minimax-m2.1","name":"MiniMax: MiniMax M2.1","created_by":"minimax","source":"official","last_updated":"2026-05-17","description":"MiniMax-M2.1 is a lightweight, state-of-the-art large language model optimized for coding, agentic workflows, and modern application development.","context_window":204800,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"fine_tuning":true},"pricing":{"input":0.29,"output":0.95,"cached_input":0.03},"family":"minimax","model_type":"chat","release_date":"2025-12-23","tagline":"MiniMax-M2.1 is a lightweight, state-of-the-art large language model optimized for coding, agentic workflows, and modern application development.","tools":["function_calling"],"max_output_tokens":196608,"license":"mit","open_weight":true},{"id":"minimax/minimax-m2.5:free","name":"MiniMax: MiniMax M2.5 (free)","created_by":"minimax","source":"official","last_updated":"2026-05-17","description":"MiniMax-M2.5 is a SOTA large language model designed for real-world productivity.","context_window":204800,"max_output_tokens":8192,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"family":"minimax","model_type":"chat","release_date":"2026-02-12","tagline":"MiniMax-M2.5 is a SOTA large language model designed for real-world productivity.","tools":["function_calling"]},{"id":"minimax/minimax-m2.5","name":"MiniMax: MiniMax 
M2.5","created_by":"minimax","source":"official","last_updated":"2026-06-29","description":"MiniMax-M2.5 is a SOTA large language model designed for real-world productivity.","context_window":204800,"max_output_tokens":196608,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"fine_tuning":true},"pricing":{"input":0.12,"output":0.48,"cached_input":0.05},"family":"minimax","model_type":"chat","release_date":"2026-02-12","tagline":"MiniMax-M2.5 is a SOTA large language model designed for real-world productivity.","tools":["function_calling"],"license":"mit","open_weight":true},{"id":"minimax/minimax-m2.7","name":"MiniMax: MiniMax M2.7","created_by":"minimax","source":"official","last_updated":"2026-06-29","description":"MiniMax-M2.7 is a next-generation large language model designed for autonomous, real-world productivity and continuous improvement.","context_window":204800,"max_output_tokens":196608,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true},"pricing":{"input":0.18,"output":0.72,"cached_input":0.05},"family":"minimax","model_type":"chat","release_date":"2026-03-18","tagline":"MiniMax-M2.7 is a next-generation large language model designed for autonomous, real-world productivity and continuous improvement.","tools":["function_calling"],"license":"proprietary","open_weight":false},{"id":"minimax/minimax-m2","name":"MiniMax: MiniMax M2","created_by":"minimax","source":"official","last_updated":"2026-05-17","description":"MiniMax-M2 is a compact, high-efficiency large language model optimized for end-to-end coding and agentic 
workflows.","context_window":204800,"max_output_tokens":196608,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true},"pricing":{"input":0.255,"output":1,"cached_input":0.03},"model_type":"chat","family":"minimax","release_date":"2025-10-23","tagline":"MiniMax-M2 is a compact, high-efficiency large language model optimized for end-to-end coding and agentic workflows.","tools":["function_calling"],"license":"proprietary","open_weight":false},{"id":"minimax/minimax-m3","name":"MiniMax: MiniMax M3","created_by":"minimax","source":"official","family":"minimax","description":"MiniMax-M3 is a multimodal foundation model from MiniMax.","release_date":"2026-05-31","context_window":1048576,"max_output_tokens":512000,"model_type":"chat","tagline":"MiniMax-M3 is a multimodal foundation model from MiniMax.","capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true},"modalities":{"input":["text","image","video"],"output":["text"]},"pricing":{"input":0.3,"output":1.2,"cached_input":0.06},"tools":["function_calling"],"last_updated":"2026-06-02","license":"proprietary","open_weight":false},{"id":"mistralai/codestral-2508","name":"Mistral: Codestral 2508","created_by":"mistral","source":"official","last_updated":"2026-03-24","family":"codestral","description":"Mistral's cutting-edge language model for coding released end of July 2025.","context_window":256000,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"vision":true,"fine_tuning":true},"pricing":{"input":0.3,"output":0.9,"cached_input":0.03},"model_type":"code","release_date":"2025-08-01","alias":"mistralai/codestral","tagline":"Mistral's cutting-edge language model for coding released end of July 
2025.","tools":["function_calling"],"license":"mnpl","open_weight":true},{"id":"mistralai/codestral","name":"Mistral: Codestral 2508","created_by":"mistral","source":"official","last_updated":"2026-03-24","family":"codestral","description":"Mistral's cutting-edge language model for coding released end of July 2025.","release_date":"2025-08-01","context_window":256000,"model_type":"code","tagline":"Mistral's cutting-edge language model for coding released end of July 2025.","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"vision":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.3,"output":0.9,"cached_input":0.03},"tools":["function_calling"],"snapshots":["mistralai/codestral-2508"],"license":"mnpl","open_weight":true},{"id":"mistralai/devstral-2512","name":"Mistral: Devstral 2 2512","created_by":"mistral","source":"official","last_updated":"2026-03-24","family":"devstral","description":"Devstral 2 is a state-of-the-art open-source model by Mistral AI specializing in agentic coding.","context_window":262144,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true},"pricing":{"input":0.4,"output":2,"cached_input":0.04},"model_type":"code","release_date":"2025-12-09","alias":"mistralai/devstral","tagline":"Devstral 2 is a state-of-the-art open-source model by Mistral AI specializing in agentic coding.","tools":["function_calling"]},{"id":"mistralai/devstral-medium","name":"Mistral: Devstral Medium","created_by":"mistral","source":"official","last_updated":"2026-03-24","family":"devstral","description":"Devstral Medium is a high-performance code generation and agentic reasoning model developed jointly by Mistral AI and All Hands 
AI.","context_window":131072,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"vision":true},"pricing":{"input":0.4,"output":2,"cached_input":0.04},"model_type":"chat","release_date":"2025-07-10","tagline":"Devstral Medium is a high-performance code generation and agentic reasoning model developed jointly by Mistral AI and All Hands AI.","tools":["function_calling"],"license":"proprietary","open_weight":false},{"id":"mistralai/devstral-small","name":"Mistral: Devstral Small 1.1","created_by":"mistral","source":"official","last_updated":"2026-03-24","family":"devstral","description":"Devstral Small 1.1 is a 24B parameter open-weight language model for software engineering agents, developed by Mistral AI in collaboration with All Hands AI.","context_window":131072,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"vision":true,"fine_tuning":true},"pricing":{"input":0.1,"output":0.3,"cached_input":0.01},"model_type":"chat","release_date":"2025-07-10","tagline":"Devstral Small 1.1 is a 24B parameter open-weight language model for software engineering agents, developed by Mistral AI in collaboration with All Hands AI.","tools":["function_calling"],"license":"apache-2.0","open_weight":true},{"id":"mistralai/devstral","name":"Mistral: Devstral 2 2512","created_by":"mistral","source":"official","last_updated":"2026-03-24","family":"devstral","description":"Devstral 2 is a state-of-the-art open-source model by Mistral AI specializing in agentic coding.","release_date":"2025-12-09","context_window":262144,"model_type":"code","tagline":"Devstral 2 is a state-of-the-art open-source model by Mistral AI specializing in agentic 
coding.","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.4,"output":2,"cached_input":0.04},"tools":["function_calling"],"snapshots":["mistralai/devstral-2512"]},{"id":"mistralai/ministral-14b-2512","name":"Mistral: Ministral 3 14B 2512","created_by":"mistral","source":"official","last_updated":"2026-03-24","family":"ministral","description":"The largest model in the Ministral 3 family, Ministral 3 14B offers frontier capabilities and performance comparable to its larger Mistral Small 3.2 24B counterpart.","context_window":262144,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"vision":true,"fine_tuning":true},"pricing":{"input":0.2,"output":0.2,"cached_input":0.02},"model_type":"chat","parameters":14,"release_date":"2025-12-02","alias":"mistralai/ministral-14b","tagline":"The largest model in the Ministral 3 family, Ministral 3 14B offers frontier capabilities and performance comparable to its larger Mistral Small 3.2 24B counterpart.","tools":["function_calling"],"license":"apache-2.0","open_weight":true},{"id":"mistralai/ministral-14b","name":"Mistral: Ministral 3 14B 2512","created_by":"mistral","source":"official","last_updated":"2026-03-24","family":"ministral","description":"The largest model in the Ministral 3 family, Ministral 3 14B offers frontier capabilities and performance comparable to its larger Mistral Small 3.2 24B counterpart.","release_date":"2025-12-02","context_window":262144,"parameters":14,"model_type":"chat","tagline":"The largest model in the Ministral 3 family, Ministral 3 14B offers frontier capabilities and performance comparable to its larger Mistral Small 3.2 24B 
counterpart.","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"vision":true,"fine_tuning":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":0.2,"output":0.2,"cached_input":0.02},"tools":["function_calling"],"snapshots":["mistralai/ministral-14b-2512"],"license":"apache-2.0","open_weight":true},{"id":"mistralai/ministral-3b-2512","name":"Mistral: Ministral 3 3B 2512","created_by":"mistral","source":"official","last_updated":"2026-03-24","family":"ministral","description":"The smallest model in the Ministral 3 family, Ministral 3 3B is a powerful, efficient tiny language model with vision capabilities.","context_window":131072,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"vision":true,"fine_tuning":true},"pricing":{"input":0.1,"output":0.1,"cached_input":0.01},"model_type":"chat","parameters":3,"release_date":"2025-12-02","alias":"mistralai/ministral-3b","tagline":"The smallest model in the Ministral 3 family, Ministral 3 3B is a powerful, efficient tiny language model with vision capabilities.","tools":["function_calling"],"license":"apache-2.0","open_weight":true},{"id":"mistralai/ministral-3b","name":"Mistral: Ministral 3 3B 2512","created_by":"mistral","source":"official","last_updated":"2026-03-24","family":"ministral","description":"The smallest model in the Ministral 3 family, Ministral 3 3B is a powerful, efficient tiny language model with vision capabilities.","release_date":"2025-12-02","context_window":131072,"parameters":3,"model_type":"chat","tagline":"The smallest model in the Ministral 3 family, Ministral 3 3B is a powerful, efficient tiny language model with vision 
capabilities.","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"vision":true,"fine_tuning":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":0.1,"output":0.1,"cached_input":0.01},"tools":["function_calling"],"snapshots":["mistralai/ministral-3b-2512"],"license":"apache-2.0","open_weight":true},{"id":"mistralai/ministral-8b-2512","name":"Mistral: Ministral 3 8B 2512","created_by":"mistral","source":"official","last_updated":"2026-03-24","family":"ministral","description":"A balanced model in the Ministral 3 family, Ministral 3 8B is a powerful, efficient tiny language model with vision capabilities.","context_window":262144,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"vision":true,"fine_tuning":true},"pricing":{"input":0.15,"output":0.15,"cached_input":0.015},"model_type":"chat","parameters":8,"release_date":"2025-12-02","alias":"mistralai/ministral-8b","tagline":"A balanced model in the Ministral 3 family, Ministral 3 8B is a powerful, efficient tiny language model with vision capabilities.","tools":["function_calling"],"license":"apache-2.0","open_weight":true},{"id":"mistralai/ministral-8b","name":"Mistral: Ministral 3 8B 2512","created_by":"mistral","source":"official","last_updated":"2026-03-24","family":"ministral","description":"A balanced model in the Ministral 3 family, Ministral 3 8B is a powerful, efficient tiny language model with vision capabilities.","release_date":"2025-12-02","context_window":262144,"parameters":8,"model_type":"chat","tagline":"A balanced model in the Ministral 3 family, Ministral 3 8B is a powerful, efficient tiny language model with vision 
capabilities.","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"vision":true,"fine_tuning":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":0.15,"output":0.15,"cached_input":0.015},"tools":["function_calling"],"snapshots":["mistralai/ministral-8b-2512"],"license":"apache-2.0","open_weight":true},{"id":"mistralai/mistral-7b-instruct-v0.1","name":"Mistral: Mistral 7B Instruct v0.1","created_by":"mistral","source":"official","last_updated":"2026-05-23","description":"A 7.3B parameter model that outperforms Llama 2 13B on all benchmarks, with optimizations for speed and context length.","context_window":4096,"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.11,"output":0.19},"model_type":"chat","family":"mistral-7b","parameters":7,"release_date":"2023-09-28","tagline":"A 7.3B parameter model that outperforms Llama 2 13B on all benchmarks, with optimizations for speed and context length.","status":"deprecated","deprecation_date":"2026-05-30","max_output_tokens":2824},{"id":"mistralai/mistral-large-2407","name":"Mistral Large 2407","created_by":"mistral","source":"official","last_updated":"2026-03-24","family":"mistral-large","description":"This is Mistral AI's flagship model, Mistral Large 2 (version mistral-large-2407).","context_window":131072,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"fine_tuning":true},"pricing":{"input":2,"output":6,"cached_input":0.2},"model_type":"chat","release_date":"2024-11-19","alias":"mistralai/mistral-large","tagline":"This is Mistral AI's flagship model, Mistral Large 2 (version mistral-large-2407).","tools":["function_calling"],"license":"apache-2.0","open_weight":true},{"id":"mistralai/mistral-large-2411","name":"Mistral Large 
2411","created_by":"mistral","source":"official","last_updated":"2026-04-07","family":"mistral-large","description":"Mistral Large 2 2411 is an update of [Mistral Large 2](/mistralai/mistral-large) released together with [Pixtral Large 2411](/mistralai/pixtral-large-2411) It provides a significant upgrade on the pre","context_window":131072,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"vision":true,"fine_tuning":true},"pricing":{"input":2,"output":6,"cached_input":0.2},"model_type":"chat","release_date":"2024-11-19","alias":"mistralai/mistral-large","tagline":"Mistral Large 2 2411 is an update of [Mistral Large 2](/mistralai/mistral-large) released together with [Pixtral Large 2411](/mistralai/pixtral-large-2411)\n\nIt provides a significant upgrade on the pr","tools":["function_calling"],"license":"apache-2.0","open_weight":true},{"id":"mistralai/mistral-large-2512","name":"Mistral: Mistral Large 3 2512","created_by":"mistral","source":"official","last_updated":"2026-03-24","family":"mistral-large","description":"Mistral Large 3 2512 is Mistral’s most capable model to date, featuring a sparse mixture-of-experts architecture with 41B active parameters (675B total), and released under the Apache 2.0 license.","context_window":262144,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"vision":true,"fine_tuning":true},"pricing":{"input":0.5,"output":1.5,"cached_input":0.05},"model_type":"chat","release_date":"2025-12-01","alias":"mistralai/mistral-large","tagline":"Mistral Large 3 2512 is Mistral’s most capable model to date, featuring a sparse mixture-of-experts architecture with 41B active parameters (675B total), and released under the Apache 2.0 
license.","tools":["function_calling"],"license":"apache-2.0","open_weight":true},{"id":"mistralai/mistral-large","name":"Mistral Large","created_by":"mistral","source":"official","last_updated":"2026-03-26","family":"mistral-large","description":"This is Mistral AI's flagship model, Mistral Large 2 (version `mistral-large-2407`).","context_window":128000,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"vision":true,"fine_tuning":true},"pricing":{"input":2,"output":6,"cached_input":0.2},"model_type":"chat","release_date":"2024-02-26","tagline":"Mistral Large 3 2512 is Mistral’s most capable model to date, featuring a sparse mixture-of-experts architecture with 41B active parameters (675B total), and released under the Apache 2.0 license.","tools":["function_calling"],"snapshots":["mistralai/mistral-large-2512","mistralai/mistral-large-2411","mistralai/mistral-large-2407"],"license":"apache-2.0","open_weight":true},{"id":"mistralai/mistral-medium-3-5","name":"Mistral: Mistral Medium 3.5","created_by":"mistral","source":"official","family":"mistral-medium","description":"Mistral Medium 3.5 is a dense 128B instruction-following model from Mistral AI.","release_date":"2026-04-30","context_window":262144,"model_type":"chat","tagline":"Mistral Medium 3.5 is a dense 128B instruction-following model from Mistral AI.","capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"vision":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":1.5,"output":7.5},"tools":["function_calling"],"last_updated":"2026-05-06","license":"proprietary","open_weight":false},{"id":"mistralai/mistral-medium-3.1","name":"Mistral: Mistral Medium 3.1","created_by":"mistral","source":"official","last_updated":"2026-03-24","family":"mistral-medium","description":"Mistral Medium 3.1 is an updated version of Mistral Medium 3, which 
is a high-performance enterprise-grade language model designed to deliver frontier-level capabilities at significantly reduced operational cost.","context_window":131072,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true},"pricing":{"input":0.4,"output":2,"cached_input":0.04},"model_type":"chat","release_date":"2025-08-13","tagline":"Mistral Medium 3.1 is an updated version of Mistral Medium 3, which is a high-performance enterprise-grade language model designed to deliver frontier-level capabilities at significantly reduced opera","tools":["function_calling"]},{"id":"mistralai/mistral-medium-3","name":"Mistral: Mistral Medium 3","created_by":"mistral","source":"official","last_updated":"2026-03-24","family":"mistral-medium","description":"Mistral Medium 3 is a high-performance enterprise-grade language model designed to deliver frontier-level capabilities at significantly reduced operational cost.","context_window":131072,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true},"pricing":{"input":0.4,"output":2,"cached_input":0.04},"model_type":"chat","release_date":"2025-05-07","tagline":"Mistral Medium 3 is a high-performance enterprise-grade language model designed to deliver frontier-level capabilities at significantly reduced operational cost.","tools":["function_calling"]},{"id":"mistralai/mistral-nemo","name":"Mistral: Mistral Nemo","created_by":"mistral","source":"official","last_updated":"2026-05-23","description":"A 12B parameter model with a 128k token context length built by Mistral in collaboration with 
NVIDIA.","context_window":131072,"max_output_tokens":16384,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"vision":true,"fine_tuning":true},"pricing":{"input":0.02,"output":0.03},"model_type":"chat","family":"mistral-nemo","release_date":"2024-07-19","tagline":"A 12B parameter model with a 128k token context length built by Mistral in collaboration with NVIDIA.","tools":["function_calling"],"license":"apache-2.0","open_weight":true},{"id":"mistralai/mistral-saba","name":"Mistral: Saba","created_by":"mistral","source":"official","last_updated":"2026-03-24","description":"Mistral Saba is a 24B-parameter language model specifically designed for the Middle East and South Asia, delivering accurate and contextually relevant responses while maintaining efficient performance.","context_window":32768,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"fine_tuning":true},"pricing":{"input":0.2,"output":0.6,"cached_input":0.02},"model_type":"chat","family":"mistral-saba","release_date":"2025-02-17","tagline":"Mistral Saba is a 24B-parameter language model specifically designed for the Middle East and South Asia, delivering accurate and contextually relevant responses while maintaining efficient performance","tools":["function_calling"],"license":"apache-2.0","open_weight":true},{"id":"mistralai/mistral-small-24b-instruct-2501","name":"Mistral: Mistral Small 3","created_by":"mistral","source":"official","last_updated":"2026-03-24","family":"mistral-small","description":"Mistral Small 3 is a 24B-parameter language model optimized for low-latency performance across common AI 
tasks.","context_window":32768,"max_output_tokens":16384,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true},"pricing":{"input":0.05,"output":0.08},"model_type":"chat","parameters":24,"release_date":"2025-01-30","alias":"mistralai/mistral-small-24b-instruct","tagline":"Mistral Small 3 is a 24B-parameter language model optimized for low-latency performance across common AI tasks.","tools":["function_calling"]},{"id":"mistralai/mistral-small-24b-instruct","name":"Mistral: Mistral Small 3","created_by":"mistral","source":"official","last_updated":"2026-03-24","family":"mistral-small","description":"Mistral Small 3 is a 24B-parameter language model optimized for low-latency performance across common AI tasks.","release_date":"2025-01-30","context_window":32768,"max_output_tokens":16384,"parameters":24,"model_type":"chat","tagline":"Mistral Small 3 is a 24B-parameter language model optimized for low-latency performance across common AI tasks.","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.05,"output":0.08},"tools":["function_calling"],"snapshots":["mistralai/mistral-small-24b-instruct-2501"]},{"id":"mistralai/mistral-small-2603","name":"Mistral: Mistral Small 4","created_by":"mistral","source":"official","last_updated":"2026-03-24","family":"mistral-small","description":"Mistral Small 4 is the next major release in the Mistral Small family, unifying the capabilities of several flagship Mistral models into a single 
system.","context_window":262144,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"vision":true,"fine_tuning":true},"pricing":{"input":0.15,"output":0.6,"cached_input":0.015},"model_type":"chat","release_date":"2026-03-16","alias":"mistralai/mistral-small","tagline":"Mistral Small 4 is the next major release in the Mistral Small family, unifying the capabilities of several flagship Mistral models into a single system.","tools":["function_calling"],"license":"apache-2.0","open_weight":true},{"id":"mistralai/mistral-small-3.1-24b-instruct:free","name":"Mistral: Mistral Small 3.1 24B (free)","created_by":"mistral","source":"official","last_updated":"2026-03-24","family":"mistral-small","description":"Mistral Small 3.1 24B Instruct is an upgraded variant of Mistral Small 3 (2501), featuring 24 billion parameters with advanced multimodal capabilities.","status":"deprecated","deprecation_date":"2026-03-29","context_window":128000,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true},"model_type":"chat","parameters":24,"release_date":"2025-03-17","tagline":"Mistral Small 3.1 24B Instruct is an upgraded variant of Mistral Small 3 (2501), featuring 24 billion parameters with advanced multimodal capabilities.","tools":["function_calling"]},{"id":"mistralai/mistral-small-3.1-24b-instruct","name":"Mistral: Mistral Small 3.1 24B","created_by":"mistral","source":"official","last_updated":"2026-05-23","family":"mistral-small","description":"Mistral Small 3.1 24B Instruct is an upgraded variant of Mistral Small 3 (2501), featuring 24 billion parameters with advanced multimodal 
capabilities.","context_window":128000,"max_output_tokens":128000,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"structured_output":true,"json_mode":true},"pricing":{"input":0.351,"output":0.555,"cached_input":0.015},"model_type":"chat","parameters":24,"release_date":"2025-03-17","tagline":"Mistral Small 3.1 24B Instruct is an upgraded variant of Mistral Small 3 (2501), featuring 24 billion parameters with advanced multimodal capabilities."},{"id":"mistralai/mistral-small-3.2-24b-instruct","name":"Mistral: Mistral Small 3.2 24B","created_by":"mistral","source":"official","last_updated":"2026-04-25","family":"mistral-small","description":"Mistral-Small-3.2-24B-Instruct-2506 is an updated 24B parameter model from Mistral optimized for instruction following, repetition reduction, and improved function calling.","context_window":128000,"modalities":{"input":["image","text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true},"pricing":{"input":0.075,"output":0.2},"model_type":"chat","parameters":24,"release_date":"2025-06-20","tagline":"Mistral-Small-3.2-24B-Instruct-2506 is an updated 24B parameter model from Mistral optimized for instruction following, repetition reduction, and improved function calling.","tools":["function_calling"],"max_output_tokens":16384},{"id":"mistralai/mistral-small-creative","name":"Mistral: Mistral Small Creative","created_by":"mistral","source":"official","last_updated":"2026-03-23","family":"mistral-small","description":"Mistral Small Creative is an experimental small model designed for creative writing, narrative generation, roleplay and character-driven dialogue, general-purpose instruction following, and 
conversati","status":"deprecated","deprecation_date":"2026-04-30","context_window":32768,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"streaming":true,"vision":true,"fine_tuning":true},"pricing":{"input":0.1,"output":0.3,"cached_input":0.01},"model_type":"chat","release_date":"2025-12-16","tagline":"Mistral Small Creative is an experimental small model designed for creative writing, narrative generation, roleplay and character-driven dialogue, general-purpose instruction following, and conversati","tools":["function_calling"],"license":"apache-2.0","open_weight":true},{"id":"mistralai/mistral-small","name":"Mistral: Mistral Small 4","created_by":"mistral","source":"official","last_updated":"2026-03-24","family":"mistral-small","description":"Mistral Small 4 is the next major release in the Mistral Small family, unifying the capabilities of several flagship Mistral models into a single system.","release_date":"2026-03-16","context_window":262144,"model_type":"chat","tagline":"Mistral Small 4 is the next major release in the Mistral Small family, unifying the capabilities of several flagship Mistral models into a single system.","capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"vision":true,"fine_tuning":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":0.15,"output":0.6,"cached_input":0.015},"tools":["function_calling"],"snapshots":["mistralai/mistral-small-2603"],"license":"apache-2.0","open_weight":true},{"id":"mistralai/mixtral-8x22b-instruct","name":"Mistral: Mixtral 8x22B Instruct","created_by":"mistral","source":"official","last_updated":"2026-03-24","family":"mixtral","description":"Mistral's official instruct fine-tuned version of [Mixtral 
8x22B](/models/mistralai/mixtral-8x22b).","context_window":65536,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true},"pricing":{"input":2,"output":6,"cached_input":0.2},"model_type":"chat","release_date":"2024-04-17","tagline":"Mistral's official instruct fine-tuned version of [Mixtral 8x22B](/models/mistralai/mixtral-8x22b).","tools":["function_calling"]},{"id":"mistralai/mixtral-8x7b-instruct","name":"Mistral: Mixtral 8x7B Instruct","created_by":"mistral","source":"official","last_updated":"2026-05-07","family":"mixtral","description":"Mixtral 8x7B Instruct is a pretrained generative Sparse Mixture of Experts, by Mistral AI, for chat and instruction use.","context_window":32768,"max_output_tokens":16384,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true},"pricing":{"input":0.54,"output":0.54},"model_type":"chat","release_date":"2023-12-10","tagline":"Mixtral 8x7B Instruct is a pretrained generative Sparse Mixture of Experts, by Mistral AI, for chat and instruction use.","tools":["function_calling"],"status":"deprecated","deprecation_date":"2026-05-07"},{"id":"mistralai/pixtral-12b","name":"Mistral: Pixtral 12B","created_by":"mistral","source":"official","last_updated":"2026-03-23","family":"pixtral","description":"The first multi-modal, text+image-to-text model from Mistral AI.","context_window":32768,"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":0.1,"output":0.1},"model_type":"chat","parameters":12,"release_date":"2024-09-10","tagline":"The first multi-modal, text+image-to-text model from Mistral AI.","license":"apache-2.0","open_weight":true,"capabilities":{"streaming":true,"vision":true,"tool_call":true,"fine_tuning":true}},{"id":"mistralai/pixtral-large-2411","name":"Mistral: Pixtral Large 
2411","created_by":"mistral","source":"official","last_updated":"2026-03-24","family":"pixtral","description":"Pixtral Large is a 124B parameter, open-weight, multimodal model built on top of [Mistral Large 2](/mistralai/mistral-large-2411).","context_window":131072,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"vision":true,"fine_tuning":true},"pricing":{"input":2,"output":6,"cached_input":0.2},"model_type":"chat","release_date":"2024-11-19","alias":"mistralai/pixtral-large","tagline":"Pixtral Large is a 124B parameter, open-weight, multimodal model built on top of [Mistral Large 2](/mistralai/mistral-large-2411).","tools":["function_calling"],"license":"mnpl","open_weight":true},{"id":"mistralai/pixtral-large","name":"Mistral: Pixtral Large 2411","created_by":"mistral","source":"official","last_updated":"2026-03-24","family":"pixtral","description":"Pixtral Large is a 124B parameter, open-weight, multimodal model built on top of [Mistral Large 2](/mistralai/mistral-large-2411).","release_date":"2024-11-19","context_window":131072,"model_type":"chat","tagline":"Pixtral Large is a 124B parameter, open-weight, multimodal model built on top of [Mistral Large 2](/mistralai/mistral-large-2411).","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"vision":true,"fine_tuning":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":2,"output":6,"cached_input":0.2},"tools":["function_calling"],"snapshots":["mistralai/pixtral-large-2411"],"license":"mnpl","open_weight":true},{"id":"mistralai/voxtral-small-24b-2507","name":"Mistral: Voxtral Small 24B 2507","created_by":"mistral","source":"official","last_updated":"2026-03-24","description":"Voxtral Small is an enhancement of Mistral Small 3, incorporating state-of-the-art audio input capabilities while retaining best-in-class text 
performance.","context_window":32000,"modalities":{"input":["text","audio"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true},"pricing":{"input":0.1,"output":0.3,"cached_input":0.01},"model_type":"audio","family":"voxtral","parameters":24,"release_date":"2025-10-30","alias":"mistralai/voxtral-small-24b","tagline":"Voxtral Small is an enhancement of Mistral Small 3, incorporating state-of-the-art audio input capabilities while retaining best-in-class text performance.","tools":["function_calling"]},{"id":"mistralai/voxtral-small-24b","name":"Mistral: Voxtral Small 24B 2507","created_by":"mistral","source":"official","last_updated":"2026-03-24","family":"voxtral","description":"Voxtral Small is an enhancement of Mistral Small 3, incorporating state-of-the-art audio input capabilities while retaining best-in-class text performance.","release_date":"2025-10-30","context_window":32000,"parameters":24,"model_type":"audio","tagline":"Voxtral Small is an enhancement of Mistral Small 3, incorporating state-of-the-art audio input capabilities while retaining best-in-class text performance.","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true},"modalities":{"input":["text","audio"],"output":["text"]},"pricing":{"input":0.1,"output":0.3,"cached_input":0.01},"tools":["function_calling"],"snapshots":["mistralai/voxtral-small-24b-2507"]},{"id":"moonshotai/kimi-k2-0905","name":"MoonshotAI: Kimi K2 0905","created_by":"moonshotai","source":"official","last_updated":"2026-06-29","description":"Kimi K2 0905 is the September update of [Kimi K2 0711](moonshotai/kimi-k2).","context_window":262144,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true},"pricing":{"input":0.6,"output":2.5,"cached_input":0.15},"family":"kimi-k2","model_type":"chat","release_date":"2025-09-04","tagline":"Kimi K2 0905 is the September update of [Kimi K2 
0711](moonshotai/kimi-k2).","tools":["function_calling"],"max_output_tokens":100352,"status":"deprecated","deprecation_date":"2026-05-14"},{"id":"moonshotai/kimi-k2-thinking","name":"MoonshotAI: Kimi K2 Thinking","created_by":"moonshotai","source":"official","last_updated":"2026-06-29","description":"Kimi K2 Thinking is Moonshot AI’s most advanced open reasoning model to date, extending the K2 series into agentic, long-horizon reasoning.","context_window":262144,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":0.6,"output":2.5,"cached_input":0.6},"family":"kimi-k2","model_type":"chat","release_date":"2025-11-06","tagline":"Kimi K2 Thinking is Moonshot AI’s most advanced open reasoning model to date, extending the K2 series into agentic, long-horizon reasoning.","tools":["function_calling"],"max_output_tokens":262144},{"id":"moonshotai/kimi-k2.5","name":"MoonshotAI: Kimi K2.5","created_by":"moonshotai","source":"official","last_updated":"2026-06-18","description":"Kimi K2.5 is Moonshot AI's native multimodal model, delivering state-of-the-art visual coding capability and a self-directed agent swarm paradigm.","context_window":262144,"max_output_tokens":262144,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":0.375,"output":2.025,"cached_input":0.09},"family":"kimi-k2.5","model_type":"chat","release_date":"2026-01-27","tagline":"Kimi K2.5 is Moonshot AI's native multimodal model, delivering state-of-the-art visual coding capability and a self-directed agent swarm paradigm.","tools":["function_calling"]},{"id":"moonshotai/kimi-k2.6:free","name":"MoonshotAI: Kimi K2.6 (free)","created_by":"moonshotai","source":"official","family":"kimi-k2.6","description":"Kimi K2.6 is Moonshot AI's next-generation multimodal model, designed for 
long-horizon coding, coding-driven UI/UX generation, and multi-agent orchestration.","release_date":"2026-04-20","context_window":262144,"model_type":"chat","tagline":"Kimi K2.6 is Moonshot AI's next-generation multimodal model, designed for long-horizon coding, coding-driven UI/UX generation, and multi-agent orchestration.","capabilities":{"tool_call":true,"reasoning":true},"modalities":{"input":["text","image"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-05-29"},{"id":"moonshotai/kimi-k2.6","name":"MoonshotAI: Kimi K2.6","created_by":"moonshotai","source":"official","family":"kimi-k2.6","description":"Kimi K2.6 is Moonshot AI's next-generation multimodal model, designed for long-horizon coding, coding-driven UI/UX generation, and multi-agent orchestration.","release_date":"2026-04-20","context_window":262144,"max_output_tokens":262144,"model_type":"chat","tagline":"Kimi K2.6 is Moonshot AI's next-generation multimodal model, designed for long-horizon coding, coding-driven UI/UX generation, and multi-agent orchestration.","capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":0.55,"output":3.2,"cached_input":0.11},"tools":["function_calling"],"last_updated":"2026-06-29"},{"id":"moonshotai/kimi-k2.7-code","name":"MoonshotAI: Kimi K2.7 Code","created_by":"moonshotai","source":"official","family":"kimi-k2.7","description":"MoonshotAI: Kimi K2.7 Code is a coding-focused model in Moonshot AI's Kimi K2 family, built to complete end-to-end programming tasks reliably over long contexts.","release_date":"2026-06-12","context_window":262144,"max_output_tokens":16384,"model_type":"chat","tagline":"MoonshotAI: Kimi K2.7 Code is a coding-focused model in Moonshot AI's Kimi K2 family, built to complete end-to-end programming tasks reliably over long 
contexts.","capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":0.74,"output":3.5,"cached_input":0.15},"tools":["function_calling"],"last_updated":"2026-06-29"},{"id":"moonshotai/kimi-k2","name":"MoonshotAI: Kimi K2 0711","created_by":"moonshotai","source":"official","last_updated":"2026-06-29","description":"Kimi K2 Instruct is a large-scale Mixture-of-Experts (MoE) language model developed by Moonshot AI, featuring 1 trillion total parameters with 32 billion active per forward pass.","context_window":131072,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true},"pricing":{"input":0.57,"output":2.3},"family":"kimi-k2","model_type":"chat","release_date":"2025-07-11","tagline":"Kimi K2 Instruct is a large-scale Mixture-of-Experts (MoE) language model developed by Moonshot AI, featuring 1 trillion total parameters with 32 billion active per forward pass.","tools":["function_calling"],"max_output_tokens":100352},{"id":"morph/morph-v3-fast","name":"Morph: Morph V3 Fast","created_by":"morph","source":"official","last_updated":"2026-03-23","description":"Morph's fastest apply model for code edits.","context_window":81920,"max_output_tokens":38000,"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.8,"output":1.2},"release_date":"2025-07-07","tagline":"Morph's fastest apply model for code edits."},{"id":"morph/morph-v3-large","name":"Morph: Morph V3 Large","created_by":"morph","source":"official","last_updated":"2026-06-20","description":"Morph's high-accuracy apply model for complex code edits.","context_window":262144,"max_output_tokens":131072,"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.9,"output":1.9},"release_date":"2025-07-07","tagline":"Morph's high-accuracy apply model for complex code 
edits.","capabilities":{"structured_output":true,"json_mode":true}},{"id":"nex-agi/deepseek-v3.1-nex-n1","name":"Nex AGI: DeepSeek V3.1 Nex N1","created_by":"nex-agi","source":"official","last_updated":"2026-06-03","family":"deepseek","description":"DeepSeek V3.1 Nex-N1 is the flagship release of the Nex-N1 series — a post-trained model designed to highlight agent autonomy, tool use, and real-world productivity.","context_window":131072,"max_output_tokens":163840,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true},"pricing":{"input":0.135,"output":0.5},"release_date":"2025-12-08","tagline":"DeepSeek V3.1 Nex-N1 is the flagship release of the Nex-N1 series — a post-trained model designed to highlight agent autonomy, tool use, and real-world productivity.","tools":["function_calling"],"model_type":"chat","status":"deprecated","deprecation_date":"2026-06-08"},{"id":"nex-agi/nex-n2-pro:free","name":"Nex AGI: Nex-N2-Pro (free)","created_by":"nex-agi","source":"official","description":"Nex-N2-Pro is an agentic mixture-of-experts model from Nex AGI, with 17B active parameters out of 397B total.","release_date":"2026-06-08","context_window":262144,"max_output_tokens":262144,"tagline":"Nex-N2-Pro is an agentic mixture-of-experts model from Nex AGI, with 17B active parameters out of 397B total.","capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"modalities":{"input":["text","image"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-06-20","status":"deprecated","deprecation_date":"2026-06-22"},{"id":"nex-agi/nex-n2-pro","name":"Nex AGI: Nex-N2-Pro","created_by":"nex-agi","source":"official","description":"Nex-N2-Pro is an agentic mixture-of-experts model from Nex AGI, with 17B active parameters out of 397B total.","release_date":"2026-06-08","context_window":262144,"max_output_tokens":262144,"tagline":"Nex-N2-Pro is an agentic 
mixture-of-experts model from Nex AGI, with 17B active parameters out of 397B total.","capabilities":{"reasoning":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":0.25,"output":1,"cached_input":0.025},"last_updated":"2026-06-29"},{"id":"nousresearch/hermes-2-pro-llama-3-8b","name":"NousResearch: Hermes 2 Pro - Llama-3 8B","created_by":"nousresearch","source":"official","last_updated":"2026-05-29","description":"Hermes 2 Pro is an upgraded, retrained version of Nous Hermes 2, consisting of an updated and cleaned version of the OpenHermes 2.5 Dataset, as well as a newly introduced...","context_window":8192,"max_output_tokens":8192,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"structured_output":true,"json_mode":true},"pricing":{"input":0.14,"output":0.14},"model_type":"chat","parameters":8,"release_date":"2024-05-27","tagline":"Hermes 2 Pro is an upgraded, retrained version of Nous Hermes 2, consisting of an updated and cleaned version of the OpenHermes 2.5 Dataset, as well as a newly introduced Function Calling and JSON Mod","status":"deprecated","deprecation_date":"2026-06-05"},{"id":"nousresearch/hermes-3-llama-3.1-405b:free","name":"Nous: Hermes 3 405B Instruct (free)","created_by":"nousresearch","source":"official","last_updated":"2026-04-07","description":"Hermes 3 is a generalist language model with many improvements over Hermes 2, including advanced agentic capabilities, much better roleplaying, reasoning, multi-turn conversation, long context coheren","context_window":131072,"modalities":{"input":["text"],"output":["text"]},"model_type":"chat","release_date":"2024-08-16","tagline":"Hermes 3 is a generalist language model with many improvements over Hermes 2, including advanced agentic capabilities, much better roleplaying, reasoning, multi-turn conversation, long context coheren"},{"id":"nousresearch/hermes-3-llama-3.1-405b","name":"Nous: Hermes 3 405B 
Instruct","created_by":"nousresearch","source":"official","last_updated":"2026-04-07","description":"Hermes 3 is a generalist language model with many improvements over Hermes 2, including advanced agentic capabilities, much better roleplaying, reasoning, multi-turn conversation, long context coheren","context_window":131072,"max_output_tokens":16384,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"structured_output":true,"json_mode":true},"pricing":{"input":1,"output":1},"model_type":"chat","parameters":405,"release_date":"2024-08-16","tagline":"Hermes 3 is a generalist language model with many improvements over Hermes 2, including advanced agentic capabilities, much better roleplaying, reasoning, multi-turn conversation, long context coheren"},{"id":"nousresearch/hermes-3-llama-3.1-70b","name":"Nous: Hermes 3 70B Instruct","created_by":"nousresearch","source":"official","last_updated":"2026-06-10","description":"Hermes 3 is a generalist language model with many improvements over [Hermes 2](/models/nousresearch/nous-hermes-2-mistral-7b-dpo), including advanced agentic capabilities, much better roleplaying, rea","context_window":131072,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"structured_output":true,"json_mode":true},"pricing":{"input":0.7,"output":0.7},"model_type":"chat","parameters":70,"release_date":"2024-08-18","tagline":"Hermes 3 is a generalist language model with many improvements over [Hermes 2](/models/nousresearch/nous-hermes-2-mistral-7b-dpo), including advanced agentic capabilities, much better roleplaying, rea","max_output_tokens":16384},{"id":"nousresearch/hermes-4-405b","name":"Nous: Hermes 4 405B","created_by":"nousresearch","source":"official","last_updated":"2026-03-24","description":"Hermes 4 is a large-scale reasoning model built on Meta-Llama-3.1-405B and released by Nous 
Research.","context_window":131072,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":1,"output":3},"model_type":"chat","parameters":405,"release_date":"2025-08-26","tagline":"Hermes 4 is a large-scale reasoning model built on Meta-Llama-3.1-405B and released by Nous Research."},{"id":"nousresearch/hermes-4-70b","name":"Nous: Hermes 4 70B","created_by":"nousresearch","source":"official","last_updated":"2026-03-24","description":"Hermes 4 70B is a hybrid reasoning model from Nous Research, built on Meta-Llama-3.1-70B.","context_window":131072,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":0.13,"output":0.4},"model_type":"chat","parameters":70,"release_date":"2025-08-26","tagline":"Hermes 4 70B is a hybrid reasoning model from Nous Research, built on Meta-Llama-3.1-70B."},{"id":"nvidia/llama-3.1-nemotron-70b-instruct","name":"NVIDIA: Llama 3.1 Nemotron 70B Instruct","created_by":"nvidia","source":"official","last_updated":"2026-05-07","family":"llama-3.1","description":"NVIDIA's Llama 3.1 Nemotron 70B is a language model designed for generating precise and useful responses.","context_window":131072,"max_output_tokens":16384,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true},"pricing":{"input":1.2,"output":1.2},"model_type":"chat","parameters":70,"release_date":"2024-10-15","tagline":"NVIDIA's Llama 3.1 Nemotron 70B is a language model designed for generating precise and useful responses.","tools":["function_calling"],"status":"deprecated","deprecation_date":"2026-05-07"},{"id":"nvidia/llama-3.1-nemotron-ultra-253b-v1","name":"NVIDIA: Llama 3.1 Nemotron Ultra 253B v1","created_by":"nvidia","source":"official","last_updated":"2026-03-24","family":"llama-3.1","description":"Llama-3.1-Nemotron-Ultra-253B-v1 
is a large language model (LLM) optimized for advanced reasoning, human-interactive chat, retrieval-augmented generation (RAG), and tool-calling tasks.","context_window":131072,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":0.6,"output":1.8},"model_type":"chat","parameters":253,"release_date":"2025-04-08","tagline":"Llama-3.1-Nemotron-Ultra-253B-v1 is a large language model (LLM) optimized for advanced reasoning, human-interactive chat, retrieval-augmented generation (RAG), and tool-calling tasks."},{"id":"nvidia/llama-3.3-nemotron-super-49b-v1.5","name":"NVIDIA: Llama 3.3 Nemotron Super 49B V1.5","created_by":"nvidia","source":"official","last_updated":"2026-06-10","family":"llama-3.3","description":"Llama-3.3-Nemotron-Super-49B-v1.5 is a 49B-parameter, English-centric reasoning/chat model derived from Meta’s Llama-3.3-70B-Instruct with a 128K context.","context_window":131072,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":0.4,"output":0.4},"model_type":"chat","parameters":49,"release_date":"2025-10-10","tagline":"Llama-3.3-Nemotron-Super-49B-v1.5 is a 49B-parameter, English-centric reasoning/chat model derived from Meta’s Llama-3.3-70B-Instruct with a 128K context.","tools":["function_calling"],"max_output_tokens":16384},{"id":"nvidia/nemotron-3-nano-30b-a3b:free","name":"NVIDIA: Nemotron 3 Nano 30B A3B (free)","created_by":"nvidia","source":"official","last_updated":"2026-03-23","description":"NVIDIA Nemotron 3 Nano 30B A3B is a small language MoE model with highest compute efficiency and accuracy for developers to build specialized agentic AI 
systems.","context_window":256000,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"reasoning":true},"model_type":"chat","parameters":30,"active_parameters":3,"release_date":"2025-12-14","tagline":"NVIDIA Nemotron 3 Nano 30B A3B is a small language MoE model with highest compute efficiency and accuracy for developers to build specialized agentic AI systems.","tools":["function_calling"]},{"id":"nvidia/nemotron-3-nano-30b-a3b","name":"NVIDIA: Nemotron 3 Nano 30B A3B","created_by":"nvidia","source":"official","last_updated":"2026-04-25","description":"NVIDIA Nemotron 3 Nano 30B A3B is a small language MoE model with highest compute efficiency and accuracy for developers to build specialized agentic AI systems.","context_window":262144,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":0.05,"output":0.2},"model_type":"chat","parameters":30,"active_parameters":3,"release_date":"2025-12-14","tagline":"NVIDIA Nemotron 3 Nano 30B A3B is a small language MoE model with highest compute efficiency and accuracy for developers to build specialized agentic AI systems.","tools":["function_calling"],"max_output_tokens":228000},{"id":"nvidia/nemotron-3-nano-omni-30b-a3b-reasoning:free","name":"NVIDIA: Nemotron 3 Nano Omni (free)","created_by":"nvidia","source":"official","description":"NVIDIA Nemotron™ 3 Nano Omni is a 30B-A3B open multimodal model designed to function as a perception and context sub-agent in enterprise agent systems.","release_date":"2026-04-28","context_window":256000,"max_output_tokens":65536,"parameters":30,"active_parameters":3,"model_type":"reasoning","tagline":"NVIDIA Nemotron™ 3 Nano Omni is a 30B-A3B open multimodal model designed to function as a perception and context sub-agent in enterprise agent 
systems.","capabilities":{"tool_call":true,"reasoning":true},"modalities":{"input":["text","audio","image","video"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-05-01"},{"id":"nvidia/nemotron-3-super-120b-a12b:free","name":"NVIDIA: Nemotron 3 Super (free)","created_by":"nvidia","source":"official","last_updated":"2026-05-17","description":"NVIDIA Nemotron 3 Super is a 120B-parameter open hybrid MoE model, activating just 12B parameters for maximum compute efficiency and accuracy in complex multi-agent applications.","context_window":1000000,"max_output_tokens":262144,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"model_type":"chat","parameters":120,"active_parameters":12,"release_date":"2026-03-11","tagline":"NVIDIA Nemotron 3 Super is a 120B-parameter open hybrid MoE model, activating just 12B parameters for maximum compute efficiency and accuracy in complex multi-agent applications.","tools":["function_calling"]},{"id":"nvidia/nemotron-3-super-120b-a12b","name":"NVIDIA: Nemotron 3 Super","created_by":"nvidia","source":"official","last_updated":"2026-06-29","description":"NVIDIA Nemotron 3 Super is a 120B-parameter open hybrid MoE model, activating just 12B parameters for maximum compute efficiency and accuracy in complex multi-agent applications.","context_window":1000000,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":0.085,"output":0.4,"cached_input":0.1},"model_type":"chat","parameters":120,"active_parameters":12,"release_date":"2026-03-11","tagline":"NVIDIA Nemotron 3 Super is a 120B-parameter open hybrid MoE model, activating just 12B parameters for maximum compute efficiency and accuracy in complex multi-agent 
applications.","tools":["function_calling"],"max_output_tokens":16384},{"id":"nvidia/nemotron-3-ultra-550b-a55b:free","name":"NVIDIA: Nemotron 3 Ultra (free)","created_by":"nvidia","source":"official","description":"NVIDIA Nemotron 3 Ultra is an open frontier-reasoning and orchestration model from NVIDIA, with 55B active parameters out of 550B total (MoE).","release_date":"2026-06-04","context_window":1000000,"max_output_tokens":65536,"parameters":550,"active_parameters":55,"model_type":"chat","tagline":"NVIDIA Nemotron 3 Ultra is an open frontier-reasoning and orchestration model from NVIDIA, with 55B active parameters out of 550B total (MoE).","capabilities":{"tool_call":true,"reasoning":true},"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-06-10"},{"id":"nvidia/nemotron-3-ultra-550b-a55b","name":"NVIDIA: Nemotron 3 Ultra","created_by":"nvidia","source":"official","description":"NVIDIA Nemotron 3 Ultra is an open frontier-reasoning and orchestration model from NVIDIA, with 55B active parameters out of 550B total (MoE).","release_date":"2026-06-04","context_window":1000000,"max_output_tokens":16384,"parameters":550,"active_parameters":55,"model_type":"chat","tagline":"NVIDIA Nemotron 3 Ultra is an open frontier-reasoning and orchestration model from NVIDIA, with 55B active parameters out of 550B total (MoE).","capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.5,"output":2.2,"cached_input":0.1},"tools":["function_calling"],"last_updated":"2026-06-18"},{"id":"nvidia/nemotron-3.5-content-safety:free","name":"NVIDIA: Nemotron 3.5 Content Safety (free)","created_by":"nvidia","source":"official","description":"NVIDIA Nemotron 3.5 Content Safety is a compact 4B-parameter multimodal guardrail model from NVIDIA, fine-tuned from Google 
Gemma-3-4B.","release_date":"2026-06-04","context_window":128000,"max_output_tokens":8192,"model_type":"chat","tagline":"NVIDIA Nemotron 3.5 Content Safety is a compact 4B-parameter multimodal guardrail model from NVIDIA, fine-tuned from Google Gemma-3-4B.","capabilities":{"reasoning":true},"modalities":{"input":["text","image"],"output":["text"]},"last_updated":"2026-06-10"},{"id":"nvidia/nemotron-nano-12b-v2-vl:free","name":"NVIDIA: Nemotron Nano 12B 2 VL (free)","created_by":"nvidia","source":"official","last_updated":"2026-03-23","description":"NVIDIA Nemotron Nano 2 VL is a 12-billion-parameter open multimodal reasoning model designed for video understanding and document intelligence.","context_window":128000,"max_output_tokens":128000,"modalities":{"input":["image","text","video"],"output":["text"]},"capabilities":{"tool_call":true,"reasoning":true},"model_type":"chat","parameters":12,"release_date":"2025-10-28","tagline":"NVIDIA Nemotron Nano 2 VL is a 12-billion-parameter open multimodal reasoning model designed for video understanding and document intelligence.","tools":["function_calling"]},{"id":"nvidia/nemotron-nano-12b-v2-vl","name":"NVIDIA: Nemotron Nano 12B 2 VL","created_by":"nvidia","source":"official","last_updated":"2026-05-01","description":"NVIDIA Nemotron Nano 2 VL is a 12-billion-parameter open multimodal reasoning model designed for video understanding and document intelligence.","context_window":131072,"modalities":{"input":["image","text","video"],"output":["text"]},"capabilities":{"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":0.2,"output":0.6},"model_type":"chat","parameters":12,"release_date":"2025-10-28","tagline":"NVIDIA Nemotron Nano 2 VL is a 12-billion-parameter open multimodal reasoning model designed for video understanding and document intelligence.","max_output_tokens":16384,"status":"deprecated","deprecation_date":"2026-05-07"},{"id":"nvidia/nemotron-nano-9b-v2:free","name":"NVIDIA: Nemotron 
Nano 9B V2 (free)","created_by":"nvidia","source":"official","last_updated":"2026-03-24","description":"NVIDIA-Nemotron-Nano-9B-v2 is a large language model (LLM) trained from scratch by NVIDIA, and designed as a unified model for both reasoning and non-reasoning tasks.","context_window":128000,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"model_type":"chat","parameters":9,"release_date":"2025-09-05","tagline":"NVIDIA-Nemotron-Nano-9B-v2 is a large language model (LLM) trained from scratch by NVIDIA, and designed as a unified model for both reasoning and non-reasoning tasks.","tools":["function_calling"]},{"id":"nvidia/nemotron-nano-9b-v2","name":"NVIDIA: Nemotron Nano 9B V2","created_by":"nvidia","source":"official","last_updated":"2026-06-10","description":"NVIDIA-Nemotron-Nano-9B-v2 is a large language model (LLM) trained from scratch by NVIDIA, and designed as a unified model for both reasoning and non-reasoning tasks.","context_window":131072,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":0.04,"output":0.16},"model_type":"chat","parameters":9,"release_date":"2025-09-05","tagline":"NVIDIA-Nemotron-Nano-9B-v2 is a large language model (LLM) trained from scratch by NVIDIA, and designed as a unified model for both reasoning and non-reasoning tasks.","tools":["function_calling"],"max_output_tokens":16384,"status":"deprecated","deprecation_date":"2026-06-11"},{"id":"openai/gpt-3.5-turbo-0613","name":"OpenAI: GPT-3.5 Turbo (older v0613)","created_by":"openai","source":"official","last_updated":"2026-03-24","family":"gpt-3.5","description":"GPT-3.5 Turbo is OpenAI's fastest 
model.","context_window":4095,"max_output_tokens":4096,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"fine_tuning":true,"streaming":false,"vision":false,"reasoning":false,"batch":true},"pricing":{"input":1,"output":2},"model_type":"chat","release_date":"2024-01-25","tagline":"GPT-3.5 Turbo is OpenAI's fastest model.","tools":["function_calling"],"knowledge_cutoff":"2021-09","license":"proprietary","open_weight":false},{"id":"openai/gpt-3.5-turbo-16k","name":"OpenAI: GPT-3.5 Turbo 16k","created_by":"openai","source":"official","last_updated":"2026-03-24","family":"gpt-3.5","description":"This model offers four times the context length of gpt-3.5-turbo, allowing it to support approximately 20 pages of text in a single request at a higher cost.","context_window":16385,"max_output_tokens":4096,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true},"pricing":{"input":3,"output":4},"model_type":"chat","release_date":"2023-08-28","tagline":"This model offers four times the context length of gpt-3.5-turbo, allowing it to support approximately 20 pages of text in a single request at a higher cost.","tools":["function_calling"]},{"id":"openai/gpt-3.5-turbo-instruct","name":"OpenAI: GPT-3.5 Turbo Instruct","created_by":"openai","source":"official","last_updated":"2026-03-24","family":"gpt-3.5","description":"This model is a variant of GPT-3.5 Turbo tuned for instructional prompts and omitting chat-related optimizations.","context_window":4095,"max_output_tokens":4096,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"structured_output":true,"json_mode":true,"fine_tuning":true,"streaming":false,"vision":false,"tool_call":false,"reasoning":false},"pricing":{"input":1.5,"output":2},"model_type":"chat","release_date":"2023-09-28","tagline":"This model is a variant of GPT-3.5 Turbo tuned for instructional prompts and 
omitting chat-related optimizations.","knowledge_cutoff":"2021-09","license":"proprietary","open_weight":false},{"id":"openai/gpt-3.5-turbo","name":"OpenAI: GPT-3.5 Turbo","created_by":"openai","source":"official","last_updated":"2026-03-24","family":"gpt-3.5","description":"GPT-3.5 Turbo is OpenAI's fastest model.","context_window":16385,"max_output_tokens":4096,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"fine_tuning":true,"streaming":false,"vision":false,"reasoning":false,"batch":true},"pricing":{"input":0.5,"output":1.5},"model_type":"chat","release_date":"2023-05-28","tagline":"GPT-3.5 Turbo is OpenAI's fastest model.","tools":["function_calling"],"knowledge_cutoff":"2021-09","license":"proprietary","open_weight":false},{"id":"openai/gpt-4-0314","name":"OpenAI: GPT-4 (older v0314)","created_by":"openai","source":"official","last_updated":"2026-03-24","family":"gpt-4","description":"GPT-4-0314 is the first version of GPT-4 released, with a context length of 8,192 tokens, and was supported until June 14.","context_window":8191,"max_output_tokens":4096,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true},"pricing":{"input":30,"output":60},"model_type":"chat","release_date":"2023-05-28","tagline":"GPT-4-0314 is the first version of GPT-4 released, with a context length of 8,192 tokens, and was supported until June 14.","tools":["function_calling"]},{"id":"openai/gpt-4-1106-preview","name":"OpenAI: GPT-4 Turbo (older v1106)","created_by":"openai","source":"official","last_updated":"2026-03-24","family":"gpt-4","description":"The latest GPT-4 Turbo model with vision 
capabilities.","context_window":128000,"max_output_tokens":4096,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true},"pricing":{"input":10,"output":30},"model_type":"chat","release_date":"2023-11-06","tagline":"The latest GPT-4 Turbo model with vision capabilities.","tools":["function_calling"]},{"id":"openai/gpt-4-turbo-preview","name":"OpenAI: GPT-4 Turbo Preview","created_by":"openai","source":"official","last_updated":"2026-03-24","family":"gpt-4-turbo","description":"The preview GPT-4 model with improved instruction following, JSON mode, reproducible outputs, parallel function calling, and more.","context_window":128000,"max_output_tokens":4096,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true},"pricing":{"input":10,"output":30},"model_type":"chat","release_date":"2024-01-25","tagline":"The preview GPT-4 model with improved instruction following, JSON mode, reproducible outputs, parallel function calling, and more.","tools":["function_calling"],"license":"proprietary","open_weight":false},{"id":"openai/gpt-4-turbo","name":"OpenAI: GPT-4 Turbo","created_by":"openai","source":"official","last_updated":"2026-03-24","family":"gpt-4-turbo","description":"The latest GPT-4 Turbo model with vision capabilities.","context_window":128000,"max_output_tokens":4096,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"vision":true,"fine_tuning":false,"reasoning":false,"batch":true},"pricing":{"input":10,"output":30},"model_type":"chat","release_date":"2024-04-09","tagline":"The latest GPT-4 Turbo model with vision capabilities.","tools":["function_calling"],"knowledge_cutoff":"2023-12","license":"proprietary","open_weight":false},{"id":"openai/gpt-4.1-mini","name":"OpenAI: GPT-4.1 
Mini","created_by":"openai","source":"official","last_updated":"2026-03-24","family":"gpt-4.1","description":"GPT-4.1 Mini is a mid-sized model delivering performance competitive with GPT-4o at substantially lower latency and cost.","context_window":1047576,"max_output_tokens":32768,"modalities":{"input":["image","text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"vision":true,"fine_tuning":true,"reasoning":false,"batch":true},"pricing":{"input":0.4,"output":1.6,"cached_input":0.1},"model_type":"chat","release_date":"2025-04-14","tagline":"GPT-4.1 Mini is a mid-sized model delivering performance competitive with GPT-4o at substantially lower latency and cost.","tools":["function_calling"],"knowledge_cutoff":"2024-06","license":"proprietary","open_weight":false},{"id":"openai/gpt-4.1-nano","name":"OpenAI: GPT-4.1 Nano","created_by":"openai","source":"official","last_updated":"2026-03-24","family":"gpt-4.1","description":"For tasks that demand low latency, GPT‑4.1 nano is the fastest and cheapest model in the GPT-4.1 series.","context_window":1047576,"max_output_tokens":32768,"modalities":{"input":["image","text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"vision":true,"fine_tuning":true,"reasoning":false,"batch":true},"pricing":{"input":0.1,"output":0.4,"cached_input":0.025},"model_type":"chat","release_date":"2025-04-14","tagline":"For tasks that demand low latency, GPT‑4.1 nano is the fastest and cheapest model in the GPT-4.1 series.","tools":["function_calling"],"knowledge_cutoff":"2024-06","license":"proprietary","open_weight":false},{"id":"openai/gpt-4.1","name":"OpenAI: GPT-4.1","created_by":"openai","source":"official","last_updated":"2026-03-24","family":"gpt-4.1","description":"GPT-4.1 is a flagship large language model optimized for advanced instruction following, real-world software engineering, and long-context 
reasoning.","context_window":1047576,"max_output_tokens":32768,"modalities":{"input":["image","text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"vision":true,"fine_tuning":true,"reasoning":false,"batch":true},"pricing":{"input":2,"output":8,"cached_input":0.5},"model_type":"chat","release_date":"2025-04-14","tagline":"GPT-4.1 is a flagship large language model optimized for advanced instruction following, real-world software engineering, and long-context reasoning.","tools":["function_calling"],"knowledge_cutoff":"2024-06","license":"proprietary","open_weight":false},{"id":"openai/gpt-4","name":"OpenAI: GPT-4","created_by":"openai","source":"official","last_updated":"2026-04-07","family":"gpt-4","description":"OpenAI's flagship model, GPT-4 is a large-scale multimodal language model capable of solving difficult problems with greater accuracy than previous models due to its broader general knowledge and adva","context_window":8191,"max_output_tokens":4096,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"fine_tuning":true,"vision":false,"reasoning":false,"batch":true},"pricing":{"input":30,"output":60},"model_type":"chat","release_date":"2023-05-28","tagline":"OpenAI's flagship model, GPT-4 is a large-scale multimodal language model capable of solving difficult problems with greater accuracy than previous models due to its broader general knowledge and adva","tools":["function_calling"],"knowledge_cutoff":"2023-12","license":"proprietary","open_weight":false},{"id":"openai/gpt-4o-2024-05-13","name":"OpenAI: GPT-4o (2024-05-13)","created_by":"openai","source":"official","last_updated":"2026-03-24","family":"gpt-4o","description":"GPT-4o (\"o\" for \"omni\") is OpenAI's latest AI model, supporting both text and image inputs with text 
outputs.","context_window":128000,"max_output_tokens":4096,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"vision":true,"fine_tuning":true,"reasoning":false,"batch":true},"pricing":{"input":5,"output":15,"cached_input":1.25},"model_type":"chat","release_date":"2024-05-13","alias":"openai/gpt-4o","tagline":"GPT-4o (\"o\" for \"omni\") is OpenAI's latest AI model, supporting both text and image inputs with text outputs.","tools":["function_calling"],"knowledge_cutoff":"2023-10","license":"proprietary","open_weight":false},{"id":"openai/gpt-4o-2024-08-06","name":"OpenAI: GPT-4o (2024-08-06)","created_by":"openai","source":"official","last_updated":"2026-03-24","family":"gpt-4o","description":"The 2024-08-06 version of GPT-4o offers improved performance in structured outputs, with the ability to supply a JSON schema in the respone_format.","context_window":128000,"max_output_tokens":16384,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"vision":true,"fine_tuning":true,"reasoning":false,"batch":true},"pricing":{"input":2.5,"output":10,"cached_input":1.25},"model_type":"chat","release_date":"2024-08-06","alias":"openai/gpt-4o","tagline":"The 2024-08-06 version of GPT-4o offers improved performance in structured outputs, with the ability to supply a JSON schema in the respone_format.","tools":["function_calling"],"knowledge_cutoff":"2023-10","license":"proprietary","open_weight":false},{"id":"openai/gpt-4o-2024-11-20","name":"OpenAI: GPT-4o (2024-11-20)","created_by":"openai","source":"official","last_updated":"2026-03-24","family":"gpt-4o","description":"The 2024-11-20 version of GPT-4o offers a leveled-up creative writing ability with more natural, engaging, and tailored writing to improve relevance & 
readability.","context_window":128000,"max_output_tokens":16384,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"vision":true,"fine_tuning":false,"reasoning":false,"batch":true},"pricing":{"input":2.5,"output":10,"cached_input":1.25},"model_type":"chat","release_date":"2024-11-20","alias":"openai/gpt-4o","tagline":"The 2024-11-20 version of GPT-4o offers a leveled-up creative writing ability with more natural, engaging, and tailored writing to improve relevance & readability.","tools":["function_calling"],"knowledge_cutoff":"2023-10","license":"proprietary","open_weight":false},{"id":"openai/gpt-4o-audio-preview","name":"OpenAI: GPT-4o Audio","created_by":"openai","source":"official","last_updated":"2026-03-24","family":"gpt-4o","description":"The gpt-4o-audio-preview model adds support for audio inputs as prompts.","context_window":128000,"max_output_tokens":16384,"modalities":{"input":["audio","text"],"output":["text","audio"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"vision":false,"fine_tuning":false,"reasoning":false},"pricing":{"input":2.5,"output":10},"model_type":"chat","release_date":"2025-08-15","tagline":"The gpt-4o-audio-preview model adds support for audio inputs as prompts.","tools":["function_calling"],"knowledge_cutoff":"2023-10","license":"proprietary","open_weight":false},{"id":"openai/gpt-4o:extended","name":"OpenAI: GPT-4o (extended)","created_by":"openai","source":"official","last_updated":"2026-03-24","family":"gpt-4o","description":"GPT-4o (\"o\" for \"omni\") is OpenAI's latest AI model, supporting both text and image inputs with text 
outputs.","context_window":128000,"max_output_tokens":64000,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true},"pricing":{"input":6,"output":18},"model_type":"chat","release_date":"2024-05-13","tagline":"GPT-4o (\"o\" for \"omni\") is OpenAI's latest AI model, supporting both text and image inputs with text outputs.","tools":["function_calling"]},{"id":"openai/gpt-4o-mini-2024-07-18","name":"OpenAI: GPT-4o-mini (2024-07-18)","created_by":"openai","source":"official","last_updated":"2026-03-24","family":"gpt-4o","description":"GPT-4o mini is OpenAI's newest model after [GPT-4 Omni](/models/openai/gpt-4o), supporting both text and image inputs with text outputs.","context_window":128000,"max_output_tokens":16384,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"vision":true,"fine_tuning":true,"reasoning":false,"batch":true},"pricing":{"input":0.15,"output":0.6,"cached_input":0.075},"model_type":"chat","release_date":"2024-07-18","alias":"openai/gpt-4o-mini","tagline":"GPT-4o mini is OpenAI's newest model after [GPT-4 Omni](/models/openai/gpt-4o), supporting both text and image inputs with text outputs.","tools":["function_calling"],"knowledge_cutoff":"2023-10","license":"proprietary","open_weight":false},{"id":"openai/gpt-4o-mini-search-preview","name":"OpenAI: GPT-4o-mini Search Preview","created_by":"openai","source":"official","last_updated":"2026-03-24","family":"gpt-4o","description":"GPT-4o mini Search Preview is a specialized model for web search in Chat 
Completions.","context_window":128000,"max_output_tokens":16384,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"structured_output":true,"json_mode":true,"streaming":true,"vision":true,"tool_call":false,"fine_tuning":false,"reasoning":false},"pricing":{"input":0.15,"output":0.6},"model_type":"chat","release_date":"2025-03-12","tagline":"GPT-4o mini Search Preview is a specialized model for web search in Chat Completions.","knowledge_cutoff":"2023-10","license":"proprietary","open_weight":false},{"id":"openai/gpt-4o-mini","name":"OpenAI: GPT-4o-mini (2024-07-18)","created_by":"openai","source":"official","last_updated":"2026-06-29","family":"gpt-4o","description":"GPT-4o mini is OpenAI's newest model after [GPT-4 Omni](/models/openai/gpt-4o), supporting both text and image inputs with text outputs.","context_window":128000,"max_output_tokens":16384,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"vision":true,"fine_tuning":true,"reasoning":false,"batch":true},"pricing":{"input":0.15,"output":0.6,"cached_input":0.075},"model_type":"chat","release_date":"2024-07-18","tagline":"GPT-4o mini is OpenAI's newest model after [GPT-4 Omni](/models/openai/gpt-4o), supporting both text and image inputs with text outputs.","tools":["function_calling"],"snapshots":["openai/gpt-4o-mini-2024-07-18"],"knowledge_cutoff":"2023-10","license":"proprietary","open_weight":false},{"id":"openai/gpt-4o-search-preview","name":"OpenAI: GPT-4o Search Preview","created_by":"openai","source":"official","last_updated":"2026-03-24","family":"gpt-4o","description":"GPT-4o Search Previewis a specialized model for web search in Chat 
Completions.","context_window":128000,"max_output_tokens":16384,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"structured_output":true,"json_mode":true,"streaming":true,"vision":true,"tool_call":false,"fine_tuning":false,"reasoning":false},"pricing":{"input":2.5,"output":10},"model_type":"chat","release_date":"2025-03-12","tagline":"GPT-4o Search Previewis a specialized model for web search in Chat Completions.","knowledge_cutoff":"2023-10","license":"proprietary","open_weight":false},{"id":"openai/gpt-4o","name":"OpenAI: GPT-4o","created_by":"openai","source":"official","last_updated":"2026-06-03","family":"gpt-4o","description":"GPT-4o (\"o\" for \"omni\") is OpenAI's latest AI model, supporting both text and image inputs with text outputs.","context_window":128000,"max_output_tokens":16384,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"vision":true,"fine_tuning":false,"reasoning":false,"batch":true},"pricing":{"input":2.5,"output":10,"cached_input":1.25},"model_type":"chat","release_date":"2024-05-13","tagline":"The 2024-11-20 version of GPT-4o offers a leveled-up creative writing ability with more natural, engaging, and tailored writing to improve relevance & readability.","tools":["function_calling"],"snapshots":["openai/gpt-4o-2024-11-20","openai/gpt-4o-2024-08-06","openai/gpt-4o-2024-05-13"],"knowledge_cutoff":"2023-10","license":"proprietary","open_weight":false},{"id":"openai/gpt-5-chat","name":"OpenAI: GPT-5 Chat","created_by":"openai","source":"official","last_updated":"2026-03-24","family":"gpt-5","description":"GPT-5 Chat is designed for advanced, natural, multimodal, and context-aware conversations for enterprise 
applications.","context_window":128000,"max_output_tokens":16384,"modalities":{"input":["image","text"],"output":["text"]},"capabilities":{"structured_output":true,"json_mode":true},"pricing":{"input":1.25,"output":10,"cached_input":0.125},"model_type":"chat","release_date":"2025-08-07","tagline":"GPT-5 Chat is designed for advanced, natural, multimodal, and context-aware conversations for enterprise applications."},{"id":"openai/gpt-5-codex","name":"OpenAI: GPT-5 Codex","created_by":"openai","source":"official","last_updated":"2026-03-24","family":"gpt-5","description":"GPT-5-Codex is a specialized version of GPT-5 optimized for software engineering and coding workflows.","context_window":400000,"max_output_tokens":128000,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"vision":true,"fine_tuning":false},"pricing":{"input":1.25,"output":10,"cached_input":0.125},"model_type":"chat","release_date":"2025-09-23","tagline":"GPT-5-Codex is a specialized version of GPT-5 optimized for software engineering and coding workflows.","tools":["function_calling"],"max_input_tokens":272000,"knowledge_cutoff":"2024-09","license":"proprietary","open_weight":false},{"id":"openai/gpt-5-image-mini","name":"OpenAI: GPT-5 Image Mini","created_by":"openai","source":"official","last_updated":"2026-03-24","family":"gpt-5","description":"GPT-5 Image Mini combines OpenAI's advanced language capabilities, powered by [GPT-5 Mini](https://openrouter.ai/openai/gpt-5-mini), with GPT Image 1 Mini for efficient image generation.","context_window":400000,"max_output_tokens":128000,"modalities":{"input":["image","text"],"output":["image","text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":2.5,"output":2,"cached_input":0.25},"model_type":"chat","release_date":"2025-10-16","tagline":"GPT-5 Image Mini combines OpenAI's 
advanced language capabilities, powered by [GPT-5 Mini](https://openrouter.ai/openai/gpt-5-mini), with GPT Image 1 Mini for efficient image generation.","tools":["function_calling"]},{"id":"openai/gpt-5-image","name":"OpenAI: GPT-5 Image","created_by":"openai","source":"official","last_updated":"2026-03-24","family":"gpt-5","description":"[GPT-5](https://openrouter.ai/openai/gpt-5) Image combines OpenAI's GPT-5 model with state-of-the-art image generation capabilities.","context_window":400000,"max_output_tokens":128000,"modalities":{"input":["image","text"],"output":["image","text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":10,"output":10,"cached_input":1.25},"model_type":"chat","release_date":"2025-10-14","tagline":"[GPT-5](https://openrouter.ai/openai/gpt-5) Image combines OpenAI's GPT-5 model with state-of-the-art image generation capabilities.","tools":["function_calling"]},{"id":"openai/gpt-5-mini","name":"OpenAI: GPT-5 Mini","created_by":"openai","source":"official","last_updated":"2026-03-24","family":"gpt-5","description":"GPT-5 Mini is a compact version of GPT-5, designed to handle lighter-weight reasoning tasks.","context_window":400000,"max_output_tokens":128000,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"vision":true,"fine_tuning":false,"batch":true},"pricing":{"input":0.25,"output":2,"cached_input":0.025},"model_type":"chat","release_date":"2025-08-07","tagline":"GPT-5 Mini is a compact version of GPT-5, designed to handle lighter-weight reasoning tasks.","tools":["function_calling"],"max_input_tokens":272000,"knowledge_cutoff":"2024-05","license":"proprietary","open_weight":false},{"id":"openai/gpt-5-nano","name":"OpenAI: GPT-5 Nano","created_by":"openai","source":"official","last_updated":"2026-04-12","family":"gpt-5","description":"GPT-5-Nano is the 
smallest and fastest variant in the GPT-5 system, optimized for developer tools, rapid interactions, and ultra-low latency environments.","context_window":400000,"max_output_tokens":128000,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"vision":true,"fine_tuning":false,"batch":true},"pricing":{"input":0.05,"output":0.4,"cached_input":0.01},"model_type":"chat","release_date":"2025-08-07","tagline":"GPT-5-Nano is the smallest and fastest variant in the GPT-5 system, optimized for developer tools, rapid interactions, and ultra-low latency environments.","tools":["function_calling"],"max_input_tokens":272000,"knowledge_cutoff":"2024-05","license":"proprietary","open_weight":false},{"id":"openai/gpt-5-pro","name":"OpenAI: GPT-5 Pro","created_by":"openai","source":"official","last_updated":"2026-03-24","family":"gpt-5","description":"GPT-5 Pro is OpenAI’s most advanced model, offering major improvements in reasoning, code quality, and user experience.","context_window":400000,"max_output_tokens":128000,"modalities":{"input":["image","text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"vision":true,"fine_tuning":false,"batch":true},"pricing":{"input":15,"output":120},"model_type":"chat","release_date":"2025-10-06","tagline":"GPT-5 Pro is OpenAI’s most advanced model, offering major improvements in reasoning, code quality, and user experience.","tools":["function_calling"],"knowledge_cutoff":"2024-09","license":"proprietary","open_weight":false},{"id":"openai/gpt-5.1-chat","name":"OpenAI: GPT-5.1 Chat","created_by":"openai","source":"official","last_updated":"2026-05-29","family":"gpt-5.1","description":"GPT-5.1 Chat (AKA Instant is the fast, lightweight member of the 5.1 family, optimized for low-latency chat while retaining strong general 
intelligence.","context_window":128000,"max_output_tokens":32000,"modalities":{"input":["image","text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true},"pricing":{"input":1.25,"output":10,"cached_input":0.13},"model_type":"chat","release_date":"2025-11-13","tagline":"GPT-5.1 Chat (AKA Instant is the fast, lightweight member of the 5.1 family, optimized for low-latency chat while retaining strong general intelligence.","tools":["function_calling"]},{"id":"openai/gpt-5.1-codex-max","name":"OpenAI: GPT-5.1-Codex-Max","created_by":"openai","source":"official","last_updated":"2026-03-24","family":"gpt-5.1","description":"GPT-5.1-Codex-Max is OpenAI’s latest agentic coding model, designed for long-running, high-context software development tasks.","context_window":400000,"max_output_tokens":128000,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"vision":true,"fine_tuning":false},"pricing":{"input":1.25,"output":10,"cached_input":0.125},"model_type":"chat","release_date":"2025-12-04","tagline":"GPT-5.1-Codex-Max is OpenAI’s latest agentic coding model, designed for long-running, high-context software development tasks.","tools":["function_calling"],"knowledge_cutoff":"2024-09","license":"proprietary","open_weight":false},{"id":"openai/gpt-5.1-codex-mini","name":"OpenAI: GPT-5.1-Codex-Mini","created_by":"openai","source":"official","last_updated":"2026-05-29","family":"gpt-5.1","description":"GPT-5.1-Codex-Mini is a smaller and faster version of 
GPT-5.1-Codex","context_window":400000,"max_output_tokens":100000,"modalities":{"input":["image","text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"vision":true,"fine_tuning":false},"pricing":{"input":0.25,"output":2,"cached_input":0.025},"model_type":"chat","release_date":"2025-11-13","tagline":"GPT-5.1-Codex-Mini is a smaller and faster version of GPT-5.1-Codex","tools":["function_calling"],"knowledge_cutoff":"2024-09","license":"proprietary","open_weight":false},{"id":"openai/gpt-5.1-codex","name":"OpenAI: GPT-5.1-Codex","created_by":"openai","source":"official","last_updated":"2026-05-29","family":"gpt-5.1","description":"GPT-5.1-Codex is a specialized version of GPT-5.1 optimized for software engineering and coding workflows.","context_window":400000,"max_output_tokens":128000,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"vision":true,"fine_tuning":false},"pricing":{"input":1.25,"output":10,"cached_input":0.13},"model_type":"chat","release_date":"2025-11-13","tagline":"GPT-5.1-Codex is a specialized version of GPT-5.1 optimized for software engineering and coding workflows.","tools":["function_calling"],"knowledge_cutoff":"2024-09","license":"proprietary","open_weight":false},{"id":"openai/gpt-5.1","name":"OpenAI: GPT-5.1","created_by":"openai","source":"official","last_updated":"2026-04-12","family":"gpt-5.1","description":"GPT-5.1 is the latest frontier-grade model in the GPT-5 series, offering stronger general-purpose reasoning, improved instruction adherence, and a more natural conversational style compared to 
GPT-5.","context_window":400000,"max_output_tokens":128000,"modalities":{"input":["image","text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"vision":true,"fine_tuning":false,"batch":true},"pricing":{"input":1.25,"output":10,"cached_input":0.13},"model_type":"chat","release_date":"2025-11-13","tagline":"GPT-5.1 is the latest frontier-grade model in the GPT-5 series, offering stronger general-purpose reasoning, improved instruction adherence, and a more natural conversational style compared to GPT-5.","tools":["function_calling"],"knowledge_cutoff":"2024-09","license":"proprietary","open_weight":false},{"id":"openai/gpt-5.2-chat","name":"OpenAI: GPT-5.2 Chat","created_by":"openai","source":"official","last_updated":"2026-05-29","family":"gpt-5.2","description":"GPT-5.2 Chat (AKA Instant) is the fast, lightweight member of the 5.2 family, optimized for low-latency chat while retaining strong general intelligence.","context_window":128000,"max_output_tokens":16384,"modalities":{"input":["image","text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true},"pricing":{"input":1.75,"output":14,"cached_input":0.175},"model_type":"chat","release_date":"2025-12-10","tagline":"GPT-5.2 Chat (AKA Instant) is the fast, lightweight member of the 5.2 family, optimized for low-latency chat while retaining strong general intelligence.","tools":["function_calling"],"status":"deprecated","deprecation_date":"2026-08-10"},{"id":"openai/gpt-5.2-codex","name":"OpenAI: GPT-5.2-Codex","created_by":"openai","source":"official","last_updated":"2026-03-24","family":"gpt-5.2","description":"GPT-5.2-Codex is an upgraded version of GPT-5.1-Codex optimized for software engineering and coding 
workflows.","context_window":400000,"max_output_tokens":128000,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"vision":true,"fine_tuning":false},"pricing":{"input":1.75,"output":14,"cached_input":0.175},"model_type":"chat","release_date":"2026-01-14","tagline":"GPT-5.2-Codex is an upgraded version of GPT-5.1-Codex optimized for software engineering and coding workflows.","tools":["function_calling"],"max_input_tokens":272000,"knowledge_cutoff":"2025-08","license":"proprietary","open_weight":false},{"id":"openai/gpt-5.2-pro","name":"OpenAI: GPT-5.2 Pro","created_by":"openai","source":"official","last_updated":"2026-03-24","family":"gpt-5.2","description":"GPT-5.2 Pro is OpenAI’s most advanced model, offering major improvements in agentic coding and long context performance over GPT-5 Pro.","context_window":400000,"max_output_tokens":128000,"modalities":{"input":["image","text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"vision":true,"fine_tuning":false},"pricing":{"input":21,"output":168},"model_type":"chat","release_date":"2025-12-10","tagline":"GPT-5.2 Pro is OpenAI’s most advanced model, offering major improvements in agentic coding and long context performance over GPT-5 Pro.","tools":["function_calling"],"knowledge_cutoff":"2025-08","license":"proprietary","open_weight":false},{"id":"openai/gpt-5.2","name":"OpenAI: GPT-5.2","created_by":"openai","source":"official","last_updated":"2026-03-24","family":"gpt-5.2","description":"GPT-5.2 is the latest frontier-grade model in the GPT-5 series, offering stronger agentic and long context perfomance compared to 
GPT-5.1.","context_window":400000,"max_output_tokens":128000,"modalities":{"input":["image","text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"vision":true,"fine_tuning":false,"batch":true},"pricing":{"input":1.75,"output":14,"cached_input":0.175},"model_type":"chat","release_date":"2025-12-10","tagline":"GPT-5.2 is the latest frontier-grade model in the GPT-5 series, offering stronger agentic and long context perfomance compared to GPT-5.1.","tools":["function_calling"],"knowledge_cutoff":"2025-08","license":"proprietary","open_weight":false},{"id":"openai/gpt-5.3-chat","name":"OpenAI: GPT-5.3 Chat","created_by":"openai","source":"official","last_updated":"2026-03-24","family":"gpt-5.3","description":"GPT-5.3 Chat is an update to ChatGPT's most-used model that makes everyday conversations smoother, more useful, and more directly helpful.","context_window":128000,"max_output_tokens":16384,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true},"pricing":{"input":1.75,"output":14,"cached_input":0.175},"model_type":"chat","release_date":"2026-03-03","tagline":"GPT-5.3 Chat is an update to ChatGPT's most-used model that makes everyday conversations smoother, more useful, and more directly helpful.","tools":["function_calling"]},{"id":"openai/gpt-5.3-codex","name":"OpenAI: GPT-5.3-Codex","created_by":"openai","source":"official","last_updated":"2026-03-24","family":"gpt-5.3","description":"GPT-5.3-Codex is OpenAI’s most advanced agentic coding model, combining the frontier software engineering performance of GPT-5.2-Codex with the broader reasoning and professional knowledge capabilities of 
GPT-5.2.","context_window":400000,"max_output_tokens":128000,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"vision":true,"fine_tuning":false},"pricing":{"input":1.75,"output":14,"cached_input":0.175},"model_type":"chat","release_date":"2026-02-24","tagline":"GPT-5.3-Codex is OpenAI’s most advanced agentic coding model, combining the frontier software engineering performance of GPT-5.2-Codex with the broader reasoning and professional knowledge capabilitie","tools":["function_calling"],"max_input_tokens":272000,"knowledge_cutoff":"2025-08","license":"proprietary","open_weight":false},{"id":"openai/gpt-5.4-image-2","name":"OpenAI: GPT-5.4 Image 2","created_by":"openai","source":"official","family":"gpt-5.4","description":"[GPT-5.4](https://openrouter.ai/openai/gpt-5.4) Image 2 combines OpenAI's GPT-5.4 model with state-of-the-art image generation capabilities from GPT Image 2.","release_date":"2026-04-21","context_window":272000,"max_output_tokens":128000,"model_type":"chat","tagline":"[GPT-5.4](https://openrouter.ai/openai/gpt-5.4) Image 2 combines OpenAI's GPT-5.4 model with state-of-the-art image generation capabilities from GPT Image 2.","capabilities":{"structured_output":true,"reasoning":true,"json_mode":true},"modalities":{"input":["image","text"],"output":["image","text"]},"pricing":{"input":8,"output":15,"cached_input":2},"last_updated":"2026-04-22"},{"id":"openai/gpt-5.4-mini","name":"OpenAI: GPT-5.4 Mini","created_by":"openai","source":"official","last_updated":"2026-03-24","family":"gpt-5.4","description":"GPT-5.4 mini brings the core capabilities of GPT-5.4 to a faster, more efficient model optimized for high-throughput 
workloads.","context_window":400000,"max_output_tokens":128000,"modalities":{"input":["image","text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"vision":true,"fine_tuning":false,"batch":true},"pricing":{"input":0.75,"output":4.5,"cached_input":0.075},"model_type":"chat","release_date":"2026-03-17","tagline":"GPT-5.4 mini brings the core capabilities of GPT-5.4 to a faster, more efficient model optimized for high-throughput workloads.","tools":["function_calling"],"max_input_tokens":272000,"knowledge_cutoff":"2025-08","license":"proprietary","open_weight":false},{"id":"openai/gpt-5.4-nano","name":"OpenAI: GPT-5.4 Nano","created_by":"openai","source":"official","last_updated":"2026-03-24","family":"gpt-5.4","description":"GPT-5.4 nano is the most lightweight and cost-efficient variant of the GPT-5.4 family, optimized for speed-critical and high-volume tasks.","context_window":400000,"max_output_tokens":128000,"modalities":{"input":["image","text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"vision":true,"fine_tuning":false,"batch":true},"pricing":{"input":0.2,"output":1.25,"cached_input":0.02},"model_type":"chat","release_date":"2026-03-17","tagline":"GPT-5.4 nano is the most lightweight and cost-efficient variant of the GPT-5.4 family, optimized for speed-critical and high-volume tasks.","tools":["function_calling"],"max_input_tokens":272000,"knowledge_cutoff":"2025-08","license":"proprietary","open_weight":false},{"id":"openai/gpt-5.4-pro","name":"OpenAI: GPT-5.4 Pro","created_by":"openai","source":"official","last_updated":"2026-03-24","family":"gpt-5.4","description":"GPT-5.4 Pro is OpenAI's most advanced model, building on GPT-5.4's unified architecture with enhanced reasoning capabilities for complex, high-stakes 
tasks.","context_window":1050000,"max_output_tokens":128000,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"vision":true,"fine_tuning":false},"pricing":{"input":30,"output":180},"model_type":"chat","release_date":"2026-03-05","tagline":"GPT-5.4 Pro is OpenAI's most advanced model, building on GPT-5.4's unified architecture with enhanced reasoning capabilities for complex, high-stakes tasks.","tools":["function_calling"],"knowledge_cutoff":"2025-08","license":"proprietary","open_weight":false},{"id":"openai/gpt-5.4","name":"OpenAI: GPT-5.4","created_by":"openai","source":"official","last_updated":"2026-03-24","family":"gpt-5.4","description":"GPT-5.4 is OpenAI’s latest frontier model, unifying the Codex and GPT lines into a single system.","context_window":1050000,"max_output_tokens":128000,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"vision":true,"fine_tuning":false,"batch":true},"pricing":{"input":2.5,"output":15,"cached_input":0.25},"model_type":"chat","release_date":"2026-03-05","tagline":"GPT-5.4 is OpenAI’s latest frontier model, unifying the Codex and GPT lines into a single system.","tools":["function_calling"],"knowledge_cutoff":"2025-08","license":"proprietary","open_weight":false},{"id":"openai/gpt-5.5-pro","name":"OpenAI: GPT-5.5 Pro","created_by":"openai","source":"official","family":"gpt-5.5","description":"GPT-5.5 Pro is OpenAI’s high-capability model optimized for deep reasoning and accuracy on complex, high-stakes workloads.","release_date":"2026-04-24","context_window":1050000,"max_output_tokens":128000,"model_type":"chat","tagline":"GPT-5.5 Pro is OpenAI’s high-capability model optimized for deep reasoning and accuracy on complex, high-stakes 
workloads.","capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":false,"vision":true,"fine_tuning":false,"batch":true},"modalities":{"input":["image","text"],"output":["text"]},"pricing":{"input":30,"output":180},"tools":["function_calling"],"last_updated":"2026-04-25","knowledge_cutoff":"2025-12","license":"proprietary","open_weight":false},{"id":"openai/gpt-5.5","name":"OpenAI: GPT-5.5","created_by":"openai","source":"official","family":"gpt-5.5","description":"GPT-5.5 is OpenAI’s frontier model designed for complex professional workloads, building on GPT-5.4 with stronger reasoning, higher reliability, and improved token efficiency on hard tasks.","release_date":"2026-04-24","context_window":1050000,"max_output_tokens":128000,"model_type":"chat","tagline":"GPT-5.5 is OpenAI’s frontier model designed for complex professional workloads, building on GPT-5.4 with stronger reasoning, higher reliability, and improved token efficiency on hard tasks.","capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"vision":true,"fine_tuning":false,"batch":true},"modalities":{"input":["image","text"],"output":["text"]},"pricing":{"input":5,"output":30,"cached_input":0.5},"tools":["function_calling"],"last_updated":"2026-04-25","knowledge_cutoff":"2025-12","license":"proprietary","open_weight":false},{"id":"openai/gpt-5","name":"OpenAI: GPT-5","created_by":"openai","source":"official","last_updated":"2026-03-24","family":"gpt-5","description":"GPT-5 is OpenAI’s most advanced model, offering major improvements in reasoning, code quality, and user 
experience.","context_window":400000,"max_output_tokens":128000,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"vision":true,"fine_tuning":false,"batch":true},"pricing":{"input":1.25,"output":10,"cached_input":0.125},"model_type":"chat","release_date":"2025-08-07","tagline":"GPT-5 is OpenAI’s most advanced model, offering major improvements in reasoning, code quality, and user experience.","tools":["function_calling"],"max_input_tokens":272000,"knowledge_cutoff":"2024-09","license":"proprietary","open_weight":false},{"id":"openai/gpt-audio-mini","name":"OpenAI: GPT Audio Mini","created_by":"openai","source":"official","last_updated":"2026-04-01","family":"gpt-audio","description":"A cost-efficient version of GPT Audio.","context_window":128000,"max_output_tokens":16384,"modalities":{"input":["text","audio"],"output":["text","audio"]},"capabilities":{"structured_output":true,"json_mode":true,"tool_call":true,"streaming":false,"vision":false,"fine_tuning":false,"reasoning":false},"pricing":{"input":0.6,"output":2.4},"release_date":"2026-01-19","tagline":"A cost-efficient version of GPT Audio.","model_type":"chat","tools":["function_calling"],"knowledge_cutoff":"2023-10","license":"proprietary","open_weight":false},{"id":"openai/gpt-audio","name":"OpenAI: GPT Audio","created_by":"openai","source":"official","last_updated":"2026-04-01","family":"gpt-audio","description":"The gpt-audio model is OpenAI's first generally available audio model.","context_window":128000,"max_output_tokens":16384,"modalities":{"input":["text","audio"],"output":["text","audio"]},"capabilities":{"structured_output":true,"json_mode":true,"tool_call":true,"streaming":true,"vision":false,"fine_tuning":false,"reasoning":false},"pricing":{"input":2.5,"output":10},"release_date":"2026-01-19","tagline":"The gpt-audio model is OpenAI's first generally available audio 
model.","model_type":"chat","tools":["function_calling"],"knowledge_cutoff":"2023-10","license":"proprietary","open_weight":false},{"id":"openai/gpt-chat-latest","name":"OpenAI: GPT Chat Latest","created_by":"openai","source":"official","description":"GPT Chat Latest points to OpenAI's stable API alias `chat-latest` that always resolves to the latest Instant chat model used in ChatGPT.","release_date":"2026-05-05","context_window":400000,"max_output_tokens":128000,"tagline":"GPT Chat Latest points to OpenAI's stable API alias `chat-latest` that always resolves to the latest Instant chat model used in ChatGPT.","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":5,"output":30,"cached_input":0.5},"tools":["function_calling"],"last_updated":"2026-05-06"},{"id":"openai/gpt-oss-120b:free","name":"OpenAI: gpt-oss-120b (free)","created_by":"openai","source":"official","last_updated":"2026-03-23","family":"gpt-oss","description":"gpt-oss-120b is an open-weight, 117B-parameter Mixture-of-Experts (MoE) language model from OpenAI designed for high-reasoning, agentic, and general-purpose production use cases.","context_window":131072,"max_output_tokens":131072,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"reasoning":true},"model_type":"chat","release_date":"2025-08-05","tagline":"gpt-oss-120b is an open-weight, 117B-parameter Mixture-of-Experts (MoE) language model from OpenAI designed for high-reasoning, agentic, and general-purpose production use cases.","tools":["function_calling"]},{"id":"openai/gpt-oss-120b","name":"OpenAI: gpt-oss-120b","created_by":"openai","source":"official","last_updated":"2026-06-29","family":"gpt-oss","description":"gpt-oss-120b is an open-weight, 117B-parameter Mixture-of-Experts (MoE) language model from OpenAI designed for high-reasoning, agentic, and general-purpose production use 
cases.","context_window":131072,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"fine_tuning":false,"vision":false,"batch":true},"pricing":{"input":0.03,"output":0.15},"model_type":"chat","parameters":120,"release_date":"2025-08-05","tagline":"gpt-oss-120b is an open-weight, 117B-parameter Mixture-of-Experts (MoE) language model from OpenAI designed for high-reasoning, agentic, and general-purpose production use cases.","tools":["function_calling"],"max_output_tokens":131072,"knowledge_cutoff":"2024-06","license":"apache-2.0","open_weight":true},{"id":"openai/gpt-oss-20b:free","name":"OpenAI: gpt-oss-20b (free)","created_by":"openai","source":"official","last_updated":"2026-06-18","family":"gpt-oss","description":"gpt-oss-20b is an open-weight 21B parameter model released by OpenAI under the Apache 2.0 license.","context_window":131072,"max_output_tokens":32768,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"reasoning":true,"structured_output":true,"json_mode":true},"model_type":"chat","release_date":"2025-08-05","tagline":"gpt-oss-20b is an open-weight 21B parameter model released by OpenAI under the Apache 2.0 license.","tools":["function_calling"]},{"id":"openai/gpt-oss-20b","name":"OpenAI: gpt-oss-20b","created_by":"openai","source":"official","last_updated":"2026-06-02","family":"gpt-oss","description":"gpt-oss-20b is an open-weight 21B parameter model released by OpenAI under the Apache 2.0 license.","context_window":131072,"max_output_tokens":131072,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"fine_tuning":false,"vision":false,"batch":true},"pricing":{"input":0.029,"output":0.14,"cached_input":0.015},"model_type":"chat","parameters":20,"release_date":"2025-08-05","tagline":"gpt-oss-20b is an 
open-weight 21B parameter model released by OpenAI under the Apache 2.0 license.","tools":["function_calling"],"knowledge_cutoff":"2024-06","license":"apache-2.0","open_weight":true},{"id":"openai/gpt-oss-safeguard-20b","name":"OpenAI: gpt-oss-safeguard-20b","created_by":"openai","source":"official","last_updated":"2026-06-20","family":"gpt-oss","description":"gpt-oss-safeguard-20b is a safety reasoning model from OpenAI built upon gpt-oss-20b.","context_window":131072,"max_output_tokens":65536,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":0.075,"output":0.3,"cached_input":0.038},"model_type":"moderation","parameters":20,"release_date":"2025-10-29","tagline":"gpt-oss-safeguard-20b is a safety reasoning model from OpenAI built upon gpt-oss-20b.","tools":["function_calling"]},{"id":"openai/o1-pro","name":"OpenAI: o1-pro","created_by":"openai","source":"official","last_updated":"2026-03-24","family":"o1","description":"The o1 series of models are trained with reinforcement learning to think before they answer and perform complex reasoning.","context_window":200000,"max_output_tokens":100000,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"structured_output":true,"reasoning":true,"json_mode":true,"vision":true,"tool_call":true,"streaming":false,"fine_tuning":false,"batch":true},"pricing":{"input":150,"output":600},"model_type":"reasoning","release_date":"2025-03-19","tagline":"The o1 series of models are trained with reinforcement learning to think before they answer and perform complex reasoning.","knowledge_cutoff":"2023-10","license":"proprietary","open_weight":false},{"id":"openai/o1","name":"OpenAI: o1","created_by":"openai","source":"official","last_updated":"2026-03-24","family":"o1","description":"The latest and strongest model family from OpenAI, o1 is designed to spend more time thinking before 
responding.","context_window":200000,"max_output_tokens":100000,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"vision":true,"fine_tuning":false,"batch":true},"pricing":{"input":15,"output":60,"cached_input":7.5},"model_type":"reasoning","release_date":"2024-12-17","tagline":"The latest and strongest model family from OpenAI, o1 is designed to spend more time thinking before responding.","tools":["function_calling"],"knowledge_cutoff":"2023-10","license":"proprietary","open_weight":false},{"id":"openai/o3-deep-research","name":"OpenAI: o3 Deep Research","created_by":"openai","source":"official","last_updated":"2026-03-24","family":"o3","description":"o3-deep-research is OpenAI's advanced model for deep research, designed to tackle complex, multi-step research tasks.","context_window":200000,"max_output_tokens":100000,"modalities":{"input":["image","text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"vision":true,"fine_tuning":false,"batch":true},"pricing":{"input":10,"output":40,"cached_input":2.5},"model_type":"chat","release_date":"2025-10-10","tagline":"o3-deep-research is OpenAI's advanced model for deep research, designed to tackle complex, multi-step research tasks.","tools":["function_calling"],"knowledge_cutoff":"2024-06","license":"proprietary","open_weight":false},{"id":"openai/o3-mini-high","name":"OpenAI: o3 Mini High","created_by":"openai","source":"official","last_updated":"2026-03-24","family":"o3","description":"OpenAI o3-mini-high is the same model as [o3-mini](/openai/o3-mini) with reasoning_effort set to 
high.","context_window":200000,"max_output_tokens":100000,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":1.1,"output":4.4,"cached_input":0.55},"model_type":"reasoning","release_date":"2025-02-12","tagline":"OpenAI o3-mini-high is the same model as [o3-mini](/openai/o3-mini) with reasoning_effort set to high.","tools":["function_calling"]},{"id":"openai/o3-mini","name":"OpenAI: o3 Mini","created_by":"openai","source":"official","last_updated":"2026-03-24","family":"o3","description":"OpenAI o3-mini is a cost-efficient language model optimized for STEM reasoning tasks, particularly excelling in science, mathematics, and coding.","context_window":200000,"max_output_tokens":100000,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"vision":false,"fine_tuning":false,"batch":true},"pricing":{"input":1.1,"output":4.4,"cached_input":0.55},"model_type":"reasoning","release_date":"2025-01-31","tagline":"OpenAI o3-mini is a cost-efficient language model optimized for STEM reasoning tasks, particularly excelling in science, mathematics, and coding.","tools":["function_calling"],"knowledge_cutoff":"2023-10","license":"proprietary","open_weight":false},{"id":"openai/o3-pro","name":"OpenAI: o3 Pro","created_by":"openai","source":"official","last_updated":"2026-03-24","family":"o3","description":"The o-series of models are trained with reinforcement learning to think before they answer and perform complex 
reasoning.","context_window":200000,"max_output_tokens":100000,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"vision":true,"streaming":false,"fine_tuning":false,"batch":true},"pricing":{"input":20,"output":80},"model_type":"reasoning","release_date":"2025-06-10","tagline":"The o-series of models are trained with reinforcement learning to think before they answer and perform complex reasoning.","tools":["function_calling"],"knowledge_cutoff":"2024-06","license":"proprietary","open_weight":false},{"id":"openai/o3","name":"OpenAI: o3","created_by":"openai","source":"official","last_updated":"2026-03-24","family":"o3","description":"o3 is a well-rounded and powerful model across domains.","context_window":200000,"max_output_tokens":100000,"modalities":{"input":["image","text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"vision":true,"fine_tuning":false,"batch":true},"pricing":{"input":2,"output":8,"cached_input":0.5},"model_type":"reasoning","release_date":"2025-04-16","tagline":"o3 is a well-rounded and powerful model across domains.","tools":["function_calling"],"knowledge_cutoff":"2024-06","license":"proprietary","open_weight":false},{"id":"openai/o4-mini-deep-research","name":"OpenAI: o4 Mini Deep Research","created_by":"openai","source":"official","last_updated":"2026-03-24","family":"o4","description":"o4-mini-deep-research is OpenAI's faster, more affordable deep research model—ideal for tackling complex, multi-step research 
tasks.","context_window":200000,"max_output_tokens":100000,"modalities":{"input":["image","text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"vision":true,"fine_tuning":false,"batch":true},"pricing":{"input":2,"output":8,"cached_input":0.5},"model_type":"chat","release_date":"2025-10-10","tagline":"o4-mini-deep-research is OpenAI's faster, more affordable deep research model—ideal for tackling complex, multi-step research tasks.","tools":["function_calling"],"knowledge_cutoff":"2024-06","license":"proprietary","open_weight":false},{"id":"openai/o4-mini-high","name":"OpenAI: o4 Mini High","created_by":"openai","source":"official","last_updated":"2026-03-24","family":"o4","description":"OpenAI o4-mini-high is the same model as [o4-mini](/openai/o4-mini) with reasoning_effort set to high.","context_window":200000,"max_output_tokens":100000,"modalities":{"input":["image","text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":1.1,"output":4.4,"cached_input":0.275},"model_type":"reasoning","release_date":"2025-04-16","tagline":"OpenAI o4-mini-high is the same model as [o4-mini](/openai/o4-mini) with reasoning_effort set to high.","tools":["function_calling"]},{"id":"openai/o4-mini","name":"OpenAI: o4 Mini","created_by":"openai","source":"official","last_updated":"2026-03-24","family":"o4","description":"OpenAI o4-mini is a compact reasoning model in the o-series, optimized for fast, cost-efficient performance while retaining strong multimodal and agentic 
capabilities.","context_window":200000,"max_output_tokens":100000,"modalities":{"input":["image","text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"vision":true,"fine_tuning":true,"batch":true},"pricing":{"input":1.1,"output":4.4,"cached_input":0.275},"model_type":"reasoning","release_date":"2025-04-16","tagline":"OpenAI o4-mini is a compact reasoning model in the o-series, optimized for fast, cost-efficient performance while retaining strong multimodal and agentic capabilities.","tools":["function_calling"],"knowledge_cutoff":"2024-06","license":"proprietary","open_weight":false},{"id":"openrouter/auto","name":"Auto Router","created_by":"openrouter","source":"official","last_updated":"2026-05-10","description":"Your prompt will be processed by a meta-model and routed to one of dozens of models (see below), optimizing for the best possible output.","context_window":2000000,"modalities":{"input":["text","image","audio","video"],"output":["text","image"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"release_date":"2023-11-08","tagline":"Your prompt will be processed by a meta-model and routed to one of dozens of models (see below), optimizing for the best possible output.","tools":["function_calling"]},{"id":"openrouter/bodybuilder","name":"Body Builder (beta)","created_by":"openrouter","source":"official","last_updated":"2026-03-23","description":"Transform your natural language requests into structured OpenRouter API request objects.","context_window":128000,"modalities":{"input":["text"],"output":["text"]},"release_date":"2025-12-05","tagline":"Transform your natural language requests into structured OpenRouter API request objects."},{"id":"openrouter/elephant-alpha","name":"Elephant","created_by":"openrouter","source":"official","description":"Elephant Alpha is a 100B-parameter text model focused on intelligence efficiency, 
delivering strong performance while minimizing token usage.","release_date":"2026-04-13","context_window":262144,"max_output_tokens":32768,"tagline":"Elephant Alpha is a 100B-parameter text model focused on intelligence efficiency, delivering strong reasoning performance while minimizing token usage.","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true},"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-04-16"},{"id":"openrouter/free","name":"Free Models Router","created_by":"openrouter","source":"official","last_updated":"2026-03-24","description":"The simplest way to get free inference.","context_window":200000,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"release_date":"2026-02-01","tagline":"The simplest way to get free inference.","tools":["function_calling"]},{"id":"openrouter/fusion","name":"OpenRouter: Fusion","created_by":"openrouter","source":"official","description":"Fusion turns your prompt into a small multi-model deliberation.","release_date":"2026-06-13","context_window":1000000,"tagline":"Fusion turns your prompt into a small multi-model deliberation.","modalities":{"input":["text"],"output":["text"]},"last_updated":"2026-06-18"},{"id":"openrouter/owl-alpha","name":"Owl Alpha","created_by":"openrouter","source":"official","description":"Owl Alpha is a high-performance foundation model designed for agentic workloads.","release_date":"2026-04-28","context_window":1048756,"max_output_tokens":262144,"tagline":"Owl Alpha is a high-performance foundation model designed for agentic workloads.","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true},"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-05-01"},{"id":"openrouter/pareto-code","name":"Pareto Code 
Router","created_by":"openrouter","source":"official","description":"The Pareto Router maintains a tiered shortlist of strong coding models, ranked by [Artificial Analysis](https://artificialanalysis.ai/) coding percentiles.","release_date":"2026-04-21","context_window":2000000,"tagline":"The Pareto Router is a way to have OpenRouter always pick a strong coding model for your needs without committing to a specific one.","modalities":{"input":["text"],"output":["text"]},"last_updated":"2026-05-10"},{"id":"perceptron/perceptron-mk1","name":"Perceptron: Perceptron Mk1","created_by":"perceptron","source":"official","description":"Perceptron Mk1 (Mark One) is Perceptron's highest-quality vision-language model for video and embodied reasoning.** It accepts image and video inputs paired with natural language queries, and produces","release_date":"2026-05-12","context_window":32768,"max_output_tokens":8192,"tagline":"Perceptron Mk1 (Mark One) is Perceptron's highest-quality vision-language model for video and embodied reasoning.** It accepts image and video inputs paired with natural language queries, and produces","capabilities":{"structured_output":true,"reasoning":true,"json_mode":true},"modalities":{"input":["text","image","video"],"output":["text"]},"pricing":{"input":0.15,"output":1.5},"last_updated":"2026-05-14"},{"id":"perplexity/sonar-deep-research","name":"Perplexity: Sonar Deep Research","created_by":"perplexity","source":"official","last_updated":"2026-03-23","description":"Sonar Deep Research is a research-focused model designed for multi-step retrieval, synthesis, and reasoning across complex topics.","context_window":128000,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"reasoning":true},"pricing":{"input":2,"output":8},"family":"sonar","model_type":"chat","release_date":"2025-03-07","tagline":"Sonar Deep Research is a research-focused model designed for multi-step retrieval, synthesis, and reasoning across complex 
topics."},{"id":"perplexity/sonar-pro-search","name":"Perplexity: Sonar Pro Search","created_by":"perplexity","source":"official","last_updated":"2026-03-24","description":"Exclusively available on the OpenRouter API, Sonar Pro's new Pro Search mode is Perplexity's most advanced agentic search system.","context_window":200000,"max_output_tokens":8000,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":3,"output":15},"family":"sonar","model_type":"chat","release_date":"2025-10-30","tagline":"Exclusively available on the OpenRouter API, Sonar Pro's new Pro Search mode is Perplexity's most advanced agentic search system."},{"id":"perplexity/sonar-pro","name":"Perplexity: Sonar Pro","created_by":"perplexity","source":"official","last_updated":"2026-03-23","description":"Note: Sonar Pro pricing includes Perplexity search pricing.","context_window":200000,"max_output_tokens":8000,"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":3,"output":15},"family":"sonar","model_type":"chat","release_date":"2025-03-07","tagline":"Note: Sonar Pro pricing includes Perplexity search pricing."},{"id":"perplexity/sonar-reasoning-pro","name":"Perplexity: Sonar Reasoning Pro","created_by":"perplexity","source":"official","last_updated":"2026-03-23","description":"Note: Sonar Pro pricing includes Perplexity search pricing.","context_window":128000,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"reasoning":true},"pricing":{"input":2,"output":8},"model_type":"reasoning","family":"sonar","release_date":"2025-03-07","tagline":"Note: Sonar Pro pricing includes Perplexity search pricing."},{"id":"perplexity/sonar","name":"Perplexity: Sonar","created_by":"perplexity","source":"official","last_updated":"2026-03-23","description":"Sonar is lightweight, affordable, fast, and simple to use — now featuring citations and the ability to customize 
sources.","context_window":127072,"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":1,"output":1},"family":"sonar","model_type":"chat","release_date":"2025-01-27","tagline":"Sonar is lightweight, affordable, fast, and simple to use — now featuring citations and the ability to customize sources."},{"id":"poolside/laguna-m.1:free","name":"Poolside: Laguna M.1 (free)","created_by":"poolside","source":"official","description":"Laguna M.1 is the flagship coding agent model from [Poolside](https://poolside.ai/), optimized for complex software engineering tasks.","release_date":"2026-04-28","context_window":262144,"max_output_tokens":32768,"tagline":"Laguna M.1 is the flagship coding agent model from [Poolside](https://poolside.ai), optimized for complex software engineering tasks.","capabilities":{"tool_call":true,"reasoning":true,"structured_output":true,"json_mode":true},"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-06-20"},{"id":"poolside/laguna-m.1","name":"Poolside: Laguna M.1","created_by":"poolside","source":"official","description":"Laguna M.1 is the flagship coding agent model from [Poolside](https://poolside.ai/), optimized for complex software engineering tasks.","release_date":"2026-04-28","context_window":262144,"max_output_tokens":32768,"tagline":"Laguna M.1 is the flagship coding agent model from [Poolside](https://poolside.ai/), optimized for complex software engineering tasks.","capabilities":{"tool_call":true,"reasoning":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.2,"output":0.4,"cached_input":0.1},"tools":["function_calling"],"last_updated":"2026-06-20"},{"id":"poolside/laguna-xs.2:free","name":"Poolside: Laguna XS.2 (free)","created_by":"poolside","source":"official","description":"Laguna XS.2 is the second-generation model in the XS size class from [Poolside](https://poolside.ai/), their efficient coding agent 
series.","release_date":"2026-04-28","context_window":262144,"max_output_tokens":32768,"tagline":"Laguna XS.2 is the second-generation model in the XS size class from [Poolside](https://poolside.ai), their efficient coding agent series.","capabilities":{"tool_call":true,"reasoning":true,"structured_output":true,"json_mode":true},"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-06-18"},{"id":"poolside/laguna-xs.2","name":"Poolside: Laguna XS.2","created_by":"poolside","source":"official","description":"Laguna XS.2 is the second-generation model in the XS size class from [Poolside](https://poolside.ai/), their efficient coding agent series.","release_date":"2026-04-28","context_window":262144,"max_output_tokens":32768,"tagline":"Laguna XS.2 is the second-generation model in the XS size class from [Poolside](https://poolside.ai/), their efficient coding agent series.","capabilities":{"tool_call":true,"reasoning":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.1,"output":0.2,"cached_input":0.05},"tools":["function_calling"],"last_updated":"2026-06-20"},{"id":"prime-intellect/intellect-3","name":"Prime Intellect: INTELLECT-3","created_by":"prime-intellect","source":"official","last_updated":"2026-03-24","description":"INTELLECT-3 is a 106B-parameter Mixture-of-Experts model (12B active) post-trained from GLM-4.5-Air-Base using supervised fine-tuning (SFT) followed by large-scale reinforcement learning (RL).","context_window":131072,"max_output_tokens":131072,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":0.2,"output":1.1},"release_date":"2025-11-27","tagline":"INTELLECT-3 is a 106B-parameter Mixture-of-Experts model (12B active) post-trained from GLM-4.5-Air-Base using supervised fine-tuning (SFT) followed by large-scale reinforcement learning 
(RL).","tools":["function_calling"]},{"id":"qwen/qwen-2.5-72b-instruct","name":"Qwen2.5 72B Instruct","created_by":"qwen","source":"official","last_updated":"2026-05-17","family":"qwen","description":"Qwen2.5 72B is the latest series of Qwen large language models.","context_window":131072,"max_output_tokens":16384,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"fine_tuning":true,"reasoning":true,"batch":true},"pricing":{"input":0.36,"output":0.4},"model_type":"chat","parameters":72,"release_date":"2024-09-19","tagline":"Qwen2.5 72B is the latest series of Qwen large language models.","tools":["function_calling"],"license":"apache-2.0","open_weight":true},{"id":"qwen/qwen-2.5-7b-instruct","name":"Qwen: Qwen2.5 7B Instruct","created_by":"qwen","source":"official","last_updated":"2026-05-17","family":"qwen","description":"Qwen2.5 7B is the latest series of Qwen large language models.","context_window":131072,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"fine_tuning":true,"reasoning":true,"batch":true},"pricing":{"input":0.04,"output":0.1},"model_type":"chat","parameters":7,"release_date":"2024-10-16","tagline":"Qwen2.5 7B is the latest series of Qwen large language models.","tools":["function_calling"],"max_output_tokens":32768,"license":"apache-2.0","open_weight":true},{"id":"qwen/qwen-2.5-coder-32b-instruct","name":"Qwen2.5 Coder 32B Instruct","created_by":"qwen","source":"official","last_updated":"2026-05-23","family":"qwen","description":"Qwen2.5-Coder is the latest series of Code-Specific Qwen large language models (formerly known as CodeQwen).","context_window":128000,"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.66,"output":1},"model_type":"code","parameters":32,"release_date":"2024-11-11","tagline":"Qwen2.5-Coder is the latest series of 
Code-Specific Qwen large language models (formerly known as CodeQwen).","max_output_tokens":32768},{"id":"qwen/qwen-2.5-vl-7b-instruct","name":"Qwen: Qwen2.5-VL 7B Instruct","created_by":"qwen","source":"official","last_updated":"2026-03-23","family":"qwen","description":"Qwen2.5 VL 7B is a multimodal LLM from the Qwen Team with the following key enhancements:\n\n- SoTA understanding of images of various resolution & ratio: Qwen2.5-VL achieves state-of-the-art performanc","context_window":32768,"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":0.2,"output":0.2},"model_type":"chat","parameters":7,"release_date":"2024-08-28","tagline":"Qwen2.5 VL 7B is a multimodal LLM from the Qwen Team with the following key enhancements:\n\n- SoTA understanding of images of various resolution & ratio: Qwen2.5-VL achieves state-of-the-art performanc","license":"apache-2.0","open_weight":true,"capabilities":{"streaming":true,"reasoning":true,"tool_call":true,"structured_output":true,"batch":true,"vision":true,"fine_tuning":true,"json_mode":true}},{"id":"qwen/qwen-max","name":"Qwen: Qwen-Max ","created_by":"qwen","source":"official","last_updated":"2026-03-24","family":"qwen","description":"Qwen-Max, based on Qwen2.5, provides the best inference performance among [Qwen models](/qwen), especially for complex multi-step tasks.","context_window":32768,"max_output_tokens":8192,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"reasoning":true,"batch":true},"pricing":{"input":1.04,"output":4.16,"cached_input":0.208},"model_type":"chat","release_date":"2025-02-01","tagline":"Qwen-Max, based on Qwen2.5, provides the best inference performance among [Qwen models](/qwen), especially for complex multi-step tasks.","tools":["function_calling"],"license":"proprietary","open_weight":false},{"id":"qwen/qwen-plus-2025-07-28:thinking","name":"Qwen: Qwen Plus 0728 
(thinking)","created_by":"qwen","source":"official","last_updated":"2026-03-24","family":"qwen","description":"Qwen Plus 0728, based on the Qwen3 foundation model, is a 1 million context hybrid reasoning model with a balanced performance, speed, and cost combination.","context_window":1000000,"max_output_tokens":32768,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":0.26,"output":0.78},"model_type":"chat","release_date":"2025-09-08","tagline":"Qwen Plus 0728, based on the Qwen3 foundation model, is a 1 million context hybrid reasoning model with a balanced performance, speed, and cost combination.","tools":["function_calling"]},{"id":"qwen/qwen-plus-2025-07-28","name":"Qwen: Qwen Plus 0728","created_by":"qwen","source":"official","last_updated":"2026-03-24","family":"qwen","description":"Qwen Plus 0728, based on the Qwen3 foundation model, is a 1 million context hybrid reasoning model with a balanced performance, speed, and cost combination.","context_window":1000000,"max_output_tokens":32768,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true},"pricing":{"input":0.26,"output":0.78,"cached_input":0.052},"model_type":"chat","release_date":"2025-09-08","alias":"qwen/qwen-plus","tagline":"Qwen Plus 0728, based on the Qwen3 foundation model, is a 1 million context hybrid reasoning model with a balanced performance, speed, and cost combination.","tools":["function_calling"]},{"id":"qwen/qwen-plus","name":"Qwen: Qwen-Plus","created_by":"qwen","source":"official","last_updated":"2026-03-26","family":"qwen","description":"Qwen-Plus, based on the Qwen2.5 foundation model, is a 131K context model with a balanced performance, speed, and cost 
combination.","context_window":1000000,"max_output_tokens":32768,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"reasoning":true,"batch":true},"pricing":{"input":0.26,"output":0.78,"cached_input":0.052},"model_type":"chat","release_date":"2025-02-01","tagline":"Qwen Plus 0728, based on the Qwen3 foundation model, is a 1 million context hybrid reasoning model with a balanced performance, speed, and cost combination.","tools":["function_calling"],"snapshots":["qwen/qwen-plus-2025-07-28"],"license":"proprietary","open_weight":false},{"id":"qwen/qwen-turbo","name":"Qwen: Qwen-Turbo","created_by":"qwen","source":"official","last_updated":"2026-03-24","family":"qwen","description":"Qwen-Turbo, based on Qwen2.5, is a 1M context model that provides fast speed and low cost, suitable for simple tasks.","context_window":131072,"max_output_tokens":8192,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"reasoning":true,"batch":true},"pricing":{"input":0.033,"output":0.13,"cached_input":0.007},"model_type":"chat","release_date":"2025-02-01","tagline":"Qwen-Turbo, based on Qwen2.5, is a 1M context model that provides fast speed and low cost, suitable for simple tasks.","tools":["function_calling"],"license":"proprietary","open_weight":false},{"id":"qwen/qwen-vl-max","name":"Qwen: Qwen VL Max","created_by":"qwen","source":"official","last_updated":"2026-03-24","family":"qwen","description":"Qwen VL Max is a visual understanding model with 7500 tokens context length.","context_window":131072,"max_output_tokens":32768,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true},"pricing":{"input":0.52,"output":2.08},"model_type":"chat","release_date":"2025-02-01","tagline":"Qwen VL Max is a visual understanding model with 7500 
tokens context length.","tools":["function_calling"]},{"id":"qwen/qwen-vl-plus","name":"Qwen: Qwen VL Plus","created_by":"qwen","source":"official","last_updated":"2026-03-24","family":"qwen","description":"Qwen's Enhanced Large Visual Language Model.","context_window":131072,"max_output_tokens":8192,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"structured_output":true,"json_mode":true},"pricing":{"input":0.137,"output":0.41,"cached_input":0.027},"model_type":"chat","release_date":"2025-02-05","tagline":"Qwen's Enhanced Large Visual Language Model."},{"id":"qwen/qwen2.5-coder-7b-instruct","name":"Qwen: Qwen2.5 Coder 7B Instruct","created_by":"qwen","source":"official","last_updated":"2026-03-24","family":"qwen2.5","description":"Qwen2.5-Coder-7B-Instruct is a 7B parameter instruction-tuned language model optimized for code-related tasks such as code generation, reasoning, and bug fixing.","context_window":32768,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"structured_output":true,"json_mode":true},"pricing":{"input":0.03,"output":0.09},"model_type":"code","parameters":7,"release_date":"2025-04-15","tagline":"Qwen2.5-Coder-7B-Instruct is a 7B parameter instruction-tuned language model optimized for code-related tasks such as code generation, reasoning, and bug fixing."},{"id":"qwen/qwen2.5-vl-32b-instruct","name":"Qwen: Qwen2.5 VL 32B Instruct","created_by":"qwen","source":"official","last_updated":"2026-03-24","family":"qwen2.5","description":"Qwen2.5-VL-32B is a multimodal vision-language model fine-tuned through reinforcement learning for enhanced mathematical reasoning, structured outputs, and visual problem-solving 
capabilities.","context_window":128000,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"structured_output":true,"json_mode":true,"streaming":true,"reasoning":true,"tool_call":true,"batch":true,"vision":true,"fine_tuning":true},"pricing":{"input":0.2,"output":0.6},"model_type":"chat","parameters":32,"release_date":"2025-03-24","tagline":"Qwen2.5-VL-32B is a multimodal vision-language model fine-tuned through reinforcement learning for enhanced mathematical reasoning, structured outputs, and visual problem-solving capabilities.","license":"apache-2.0","open_weight":true},{"id":"qwen/qwen2.5-vl-72b-instruct","name":"Qwen: Qwen2.5 VL 72B Instruct","created_by":"qwen","source":"official","last_updated":"2026-06-18","family":"qwen2.5","description":"Qwen2.5-VL is proficient in recognizing common objects such as flowers, birds, fish, and insects.","context_window":131072,"max_output_tokens":128000,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"structured_output":true,"json_mode":true,"streaming":true,"reasoning":true,"tool_call":true,"batch":true,"vision":true,"fine_tuning":true},"pricing":{"input":0.8,"output":1,"cached_input":0.4},"model_type":"chat","parameters":72,"release_date":"2025-02-01","tagline":"Qwen2.5-VL is proficient in recognizing common objects such as flowers, birds, fish, and insects.","license":"apache-2.0","open_weight":true},{"id":"qwen/qwen3-14b","name":"Qwen: Qwen3 14B","created_by":"qwen","source":"official","last_updated":"2026-05-17","family":"qwen3","description":"Qwen3-14B is a dense 14.8B parameter causal language model from the Qwen3 series, designed for both complex reasoning and efficient 
dialogue.","context_window":131702,"max_output_tokens":40960,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"batch":true,"fine_tuning":true},"pricing":{"input":0.1,"output":0.24},"model_type":"chat","parameters":14,"release_date":"2025-04-28","tagline":"Qwen3-14B is a dense 14.8B parameter causal language model from the Qwen3 series, designed for both complex reasoning and efficient dialogue.","tools":["function_calling"],"license":"apache-2.0","open_weight":true},{"id":"qwen/qwen3-235b-a22b-2507","name":"Qwen: Qwen3 235B A22B Instruct 2507","created_by":"qwen","source":"official","last_updated":"2026-06-10","family":"qwen3","description":"Qwen3-235B-A22B-Instruct-2507 is a multilingual, instruction-tuned mixture-of-experts language model based on the Qwen3-235B architecture, with 22B active parameters per forward pass.","context_window":262144,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":0.09,"output":0.1},"model_type":"chat","parameters":235,"active_parameters":22,"release_date":"2025-07-21","max_output_tokens":16384,"alias":"qwen/qwen3-235b-a22b","tagline":"Qwen3-235B-A22B-Instruct-2507 is a multilingual, instruction-tuned mixture-of-experts language model based on the Qwen3-235B architecture, with 22B active parameters per forward pass.","tools":["function_calling"]},{"id":"qwen/qwen3-235b-a22b-thinking-2507","name":"Qwen: Qwen3 235B A22B Thinking 2507","created_by":"qwen","source":"official","last_updated":"2026-06-02","family":"qwen3","description":"Qwen3-235B-A22B-Thinking-2507 is a high-performance, open-weight Mixture-of-Experts (MoE) language model optimized for complex reasoning 
tasks.","context_window":262144,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"batch":true,"fine_tuning":true},"pricing":{"input":0.1,"output":0.1,"cached_input":0.1},"model_type":"chat","parameters":235,"active_parameters":22,"release_date":"2025-07-25","alias":"qwen/qwen3-235b-a22b-thinking","tagline":"Qwen3-235B-A22B-Thinking-2507 is a high-performance, open-weight Mixture-of-Experts (MoE) language model optimized for complex reasoning tasks.","tools":["function_calling"],"max_output_tokens":262144,"status":"deprecated","deprecation_date":"2026-04-22","license":"apache-2.0","open_weight":true},{"id":"qwen/qwen3-235b-a22b-thinking","name":"Qwen: Qwen3 235B A22B Thinking 2507","created_by":"qwen","source":"official","last_updated":"2026-06-02","family":"qwen3","description":"Qwen3-235B-A22B-Thinking-2507 is a high-performance, open-weight Mixture-of-Experts (MoE) language model optimized for complex reasoning tasks.","release_date":"2025-07-25","context_window":262144,"parameters":235,"active_parameters":22,"model_type":"chat","tagline":"Qwen3-235B-A22B-Thinking-2507 is a high-performance, open-weight Mixture-of-Experts (MoE) language model optimized for complex reasoning tasks.","capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"batch":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.1,"output":0.1,"cached_input":0.1},"tools":["function_calling"],"snapshots":["qwen/qwen3-235b-a22b-thinking-2507"],"max_output_tokens":262144,"status":"deprecated","deprecation_date":"2026-04-22","license":"apache-2.0","open_weight":true},{"id":"qwen/qwen3-235b-a22b","name":"Qwen: Qwen3 235B A22B","created_by":"qwen","source":"official","last_updated":"2026-03-26","family":"qwen3","description":"Qwen3-235B-A22B is a 235B parameter mixture-of-experts (MoE) model 
developed by Qwen, activating 22B parameters per forward pass.","context_window":131072,"max_output_tokens":8192,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"batch":true,"fine_tuning":true},"pricing":{"input":0.455,"output":1.82},"model_type":"chat","parameters":235,"active_parameters":22,"release_date":"2025-04-28","tagline":"Qwen3-235B-A22B-Instruct-2507 is a multilingual, instruction-tuned mixture-of-experts language model based on the Qwen3-235B architecture, with 22B active parameters per forward pass.","tools":["function_calling"],"snapshots":["qwen/qwen3-235b-a22b-2507"],"license":"apache-2.0","open_weight":true},{"id":"qwen/qwen3-30b-a3b-instruct-2507","name":"Qwen: Qwen3 30B A3B Instruct 2507","created_by":"qwen","source":"official","last_updated":"2026-06-10","family":"qwen3","description":"Qwen3-30B-A3B-Instruct-2507 is a 30.5B-parameter mixture-of-experts language model from Qwen, with 3.3B active parameters per inference.","context_window":131072,"max_output_tokens":32000,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"reasoning":true,"batch":true,"fine_tuning":true},"pricing":{"input":0.048,"output":0.193},"model_type":"chat","parameters":30,"active_parameters":3,"release_date":"2025-07-29","alias":"qwen/qwen3-30b-a3b-instruct","tagline":"Qwen3-30B-A3B-Instruct-2507 is a 30.5B-parameter mixture-of-experts language model from Qwen, with 3.3B active parameters per inference.","tools":["function_calling"],"license":"apache-2.0","open_weight":true},{"id":"qwen/qwen3-30b-a3b-instruct","name":"Qwen: Qwen3 30B A3B Instruct 2507","created_by":"qwen","source":"official","last_updated":"2026-06-10","family":"qwen3","description":"Qwen3-30B-A3B-Instruct-2507 is a 30.5B-parameter mixture-of-experts language model from Qwen, with 3.3B active parameters per 
inference.","release_date":"2025-07-29","context_window":131072,"max_output_tokens":32000,"parameters":30,"active_parameters":3,"model_type":"chat","tagline":"Qwen3-30B-A3B-Instruct-2507 is a 30.5B-parameter mixture-of-experts language model from Qwen, with 3.3B active parameters per inference.","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"reasoning":true,"batch":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.048,"output":0.193},"tools":["function_calling"],"snapshots":["qwen/qwen3-30b-a3b-instruct-2507"],"license":"apache-2.0","open_weight":true},{"id":"qwen/qwen3-30b-a3b-thinking-2507","name":"Qwen: Qwen3 30B A3B Thinking 2507","created_by":"qwen","source":"official","last_updated":"2026-03-24","family":"qwen3","description":"Qwen3-30B-A3B-Thinking-2507 is a 30B parameter Mixture-of-Experts reasoning model optimized for complex tasks requiring extended multi-step thinking.","context_window":131072,"max_output_tokens":131072,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"batch":true,"fine_tuning":true},"pricing":{"input":0.08,"output":0.4,"cached_input":0.08},"model_type":"chat","parameters":30,"active_parameters":3,"release_date":"2025-08-28","alias":"qwen/qwen3-30b-a3b-thinking","tagline":"Qwen3-30B-A3B-Thinking-2507 is a 30B parameter Mixture-of-Experts reasoning model optimized for complex tasks requiring extended multi-step thinking.","tools":["function_calling"],"license":"apache-2.0","open_weight":true},{"id":"qwen/qwen3-30b-a3b-thinking","name":"Qwen: Qwen3 30B A3B Thinking 2507","created_by":"qwen","source":"official","last_updated":"2026-03-24","family":"qwen3","description":"Qwen3-30B-A3B-Thinking-2507 is a 30B parameter Mixture-of-Experts reasoning model optimized for complex tasks requiring extended multi-step 
thinking.","release_date":"2025-08-28","context_window":131072,"max_output_tokens":131072,"parameters":30,"active_parameters":3,"model_type":"chat","tagline":"Qwen3-30B-A3B-Thinking-2507 is a 30B parameter Mixture-of-Experts reasoning model optimized for complex tasks requiring extended multi-step thinking.","capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"batch":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.08,"output":0.4,"cached_input":0.08},"tools":["function_calling"],"snapshots":["qwen/qwen3-30b-a3b-thinking-2507"],"license":"apache-2.0","open_weight":true},{"id":"qwen/qwen3-30b-a3b","name":"Qwen: Qwen3 30B A3B","created_by":"qwen","source":"official","last_updated":"2026-06-10","family":"qwen3","description":"Qwen3, the latest generation in the Qwen large language model series, features both dense and mixture-of-experts (MoE) architectures to excel in reasoning, multilingual support, and advanced agent tasks.","context_window":131072,"max_output_tokens":16384,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"batch":true,"fine_tuning":true},"pricing":{"input":0.12,"output":0.5},"model_type":"chat","parameters":30,"active_parameters":3,"release_date":"2025-04-28","tagline":"Qwen3, the latest generation in the Qwen large language model series, features both dense and mixture-of-experts (MoE) architectures to excel in reasoning, multilingual support, and advanced agent tas","tools":["function_calling"],"status":"deprecated","deprecation_date":"2026-06-05","license":"apache-2.0","open_weight":true},{"id":"qwen/qwen3-32b","name":"Qwen: Qwen3 32B","created_by":"qwen","source":"official","last_updated":"2026-05-17","family":"qwen3","description":"Qwen3-32B is a dense 32.8B parameter causal language model from the Qwen3 series, optimized for both 
complex reasoning and efficient dialogue.","context_window":131072,"max_output_tokens":16384,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"batch":true,"fine_tuning":true},"pricing":{"input":0.08,"output":0.28,"cached_input":0.04},"model_type":"chat","parameters":32,"release_date":"2025-04-28","tagline":"Qwen3-32B is a dense 32.8B parameter causal language model from the Qwen3 series, optimized for both complex reasoning and efficient dialogue.","tools":["function_calling"],"license":"apache-2.0","open_weight":true},{"id":"qwen/qwen3-4b:free","name":"Qwen: Qwen3 4B (free)","created_by":"qwen","source":"official","last_updated":"2026-03-24","family":"qwen3","description":"Qwen3-4B is a 4 billion parameter dense language model from the Qwen3 series, designed to support both general-purpose and reasoning-intensive tasks.","status":"deprecated","deprecation_date":"2026-03-29","context_window":40960,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"model_type":"chat","release_date":"2025-04-30","tagline":"Qwen3-4B is a 4 billion parameter dense language model from the Qwen3 series, designed to support both general-purpose and reasoning-intensive tasks.","tools":["function_calling"]},{"id":"qwen/qwen3-8b","name":"Qwen: Qwen3 8B","created_by":"qwen","source":"official","last_updated":"2026-05-17","family":"qwen3","description":"Qwen3-8B is a dense 8.2B parameter causal language model from the Qwen3 series, designed for both reasoning-heavy tasks and efficient 
dialogue.","context_window":131072,"max_output_tokens":8192,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"batch":true,"fine_tuning":true},"pricing":{"input":0.05,"output":0.4,"cached_input":0.05},"model_type":"chat","parameters":8,"release_date":"2025-04-28","tagline":"Qwen3-8B is a dense 8.2B parameter causal language model from the Qwen3 series, designed for both reasoning-heavy tasks and efficient dialogue.","tools":["function_calling"],"license":"apache-2.0","open_weight":true},{"id":"qwen/qwen3-coder-30b-a3b-instruct","name":"Qwen: Qwen3 Coder 30B A3B Instruct","created_by":"qwen","source":"official","last_updated":"2026-03-24","family":"qwen3","description":"Qwen3-Coder-30B-A3B-Instruct is a 30.5B parameter Mixture-of-Experts (MoE) model with 128 experts (8 active per forward pass), designed for advanced code generation, repository-scale understanding, and agentic tool use.","context_window":160000,"max_output_tokens":32768,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"reasoning":true,"batch":true,"fine_tuning":true},"pricing":{"input":0.07,"output":0.27},"model_type":"code","parameters":30,"active_parameters":3,"release_date":"2025-07-31","tagline":"Qwen3-Coder-30B-A3B-Instruct is a 30.5B parameter Mixture-of-Experts (MoE) model with 128 experts (8 active per forward pass), designed for advanced code generation, repository-scale understanding, an","tools":["function_calling"],"license":"apache-2.0","open_weight":true},{"id":"qwen/qwen3-coder-flash","name":"Qwen: Qwen3 Coder Flash","created_by":"qwen","source":"official","last_updated":"2026-03-24","family":"qwen3","description":"Qwen3 Coder Flash is Alibaba's fast and cost efficient version of their proprietary Qwen3 Coder 
Plus.","context_window":1000000,"max_output_tokens":65536,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"reasoning":true,"batch":true,"fine_tuning":true},"pricing":{"input":0.195,"output":0.975,"cached_input":0.039},"model_type":"code","release_date":"2025-09-17","tagline":"Qwen3 Coder Flash is Alibaba's fast and cost efficient version of their proprietary Qwen3 Coder Plus.","tools":["function_calling"],"license":"apache-2.0","open_weight":true},{"id":"qwen/qwen3-coder:free","name":"Qwen: Qwen3 Coder 480B A35B (free)","created_by":"qwen","source":"official","last_updated":"2026-05-17","family":"qwen3","description":"Qwen3-Coder-480B-A35B-Instruct is a Mixture-of-Experts (MoE) code generation model developed by the Qwen team.","context_window":1048576,"max_output_tokens":262000,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true},"model_type":"code","parameters":480,"active_parameters":35,"release_date":"2025-07-23","tagline":"Qwen3-Coder-480B-A35B-Instruct is a Mixture-of-Experts (MoE) code generation model developed by the Qwen team.","tools":["function_calling"]},{"id":"qwen/qwen3-coder-next","name":"Qwen: Qwen3 Coder Next","created_by":"qwen","source":"official","last_updated":"2026-05-07","family":"qwen3","description":"Qwen3-Coder-Next is an open-weight causal language model optimized for coding agents and local development workflows.","context_window":262144,"max_output_tokens":262144,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"fine_tuning":true,"reasoning":true,"batch":true},"pricing":{"input":0.11,"output":0.8,"cached_input":0.07},"model_type":"code","release_date":"2026-02-04","tagline":"Qwen3-Coder-Next is an open-weight causal language model optimized for coding agents and local development 
workflows.","tools":["function_calling"],"license":"apache-2.0","open_weight":true},{"id":"qwen/qwen3-coder-plus","name":"Qwen: Qwen3 Coder Plus","created_by":"qwen","source":"official","last_updated":"2026-03-24","family":"qwen3","description":"Qwen3 Coder Plus is Alibaba's proprietary version of the Open Source Qwen3 Coder 480B A35B.","context_window":1000000,"max_output_tokens":65536,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"fine_tuning":true,"reasoning":true,"batch":true},"pricing":{"input":0.65,"output":3.25,"cached_input":0.13},"model_type":"code","release_date":"2025-09-23","tagline":"Qwen3 Coder Plus is Alibaba's proprietary version of the Open Source Qwen3 Coder 480B A35B.","tools":["function_calling"],"license":"apache-2.0","open_weight":true},{"id":"qwen/qwen3-coder","name":"Qwen: Qwen3 Coder 480B A35B","created_by":"qwen","source":"official","last_updated":"2026-05-17","family":"qwen3","description":"Qwen3-Coder-480B-A35B-Instruct is a Mixture-of-Experts (MoE) code generation model developed by the Qwen team.","context_window":1048576,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true},"pricing":{"input":0.22,"output":1.8,"cached_input":0.022},"model_type":"code","parameters":480,"active_parameters":35,"release_date":"2025-07-23","tagline":"Qwen3-Coder-480B-A35B-Instruct is a Mixture-of-Experts (MoE) code generation model developed by the Qwen team.","tools":["function_calling"],"max_output_tokens":65536},{"id":"qwen/qwen3-max-thinking","name":"Qwen: Qwen3 Max Thinking","created_by":"qwen","source":"official","last_updated":"2026-03-24","family":"qwen3","description":"Qwen3-Max-Thinking is the flagship reasoning model in the Qwen3 series, designed for high-stakes cognitive tasks that require deep, multi-step 
reasoning.","context_window":262144,"max_output_tokens":32768,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":0.78,"output":3.9},"model_type":"chat","release_date":"2026-02-09","tagline":"Qwen3-Max-Thinking is the flagship reasoning model in the Qwen3 series, designed for high-stakes cognitive tasks that require deep, multi-step reasoning.","tools":["function_calling"]},{"id":"qwen/qwen3-max","name":"Qwen: Qwen3 Max","created_by":"qwen","source":"official","last_updated":"2026-03-24","family":"qwen3","description":"Qwen3-Max is an updated release built on the Qwen3 series, offering major improvements in reasoning, instruction following, multilingual support, and long-tail knowledge coverage compared to the January 2025 version.","context_window":262144,"max_output_tokens":32768,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"reasoning":true,"fine_tuning":true,"batch":true},"pricing":{"input":0.78,"output":3.9,"cached_input":0.156},"model_type":"chat","release_date":"2025-09-23","tagline":"Qwen3-Max is an updated release built on the Qwen3 series, offering major improvements in reasoning, instruction following, multilingual support, and long-tail knowledge coverage compared to the Janua","tools":["function_calling"],"license":"apache-2.0","open_weight":true},{"id":"qwen/qwen3-next-80b-a3b-instruct:free","name":"Qwen: Qwen3 Next 80B A3B Instruct (free)","created_by":"qwen","source":"official","last_updated":"2026-03-24","family":"qwen3","description":"Qwen3-Next-80B-A3B-Instruct is an instruction-tuned chat model in the Qwen3-Next series optimized for fast, stable responses without “thinking” 
traces.","context_window":262144,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true},"model_type":"chat","parameters":80,"active_parameters":3,"release_date":"2025-09-11","tagline":"Qwen3-Next-80B-A3B-Instruct is an instruction-tuned chat model in the Qwen3-Next series optimized for fast, stable responses without “thinking” traces.","tools":["function_calling"]},{"id":"qwen/qwen3-next-80b-a3b-instruct","name":"Qwen: Qwen3 Next 80B A3B Instruct","created_by":"qwen","source":"official","last_updated":"2026-04-25","family":"qwen3","description":"Qwen3-Next-80B-A3B-Instruct is an instruction-tuned chat model in the Qwen3-Next series optimized for fast, stable responses without “thinking” traces.","context_window":262144,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"reasoning":true,"batch":true,"fine_tuning":true},"pricing":{"input":0.09,"output":1.1},"model_type":"chat","parameters":80,"active_parameters":3,"release_date":"2025-09-11","tagline":"Qwen3-Next-80B-A3B-Instruct is an instruction-tuned chat model in the Qwen3-Next series optimized for fast, stable responses without “thinking” traces.","tools":["function_calling"],"max_output_tokens":16384,"license":"apache-2.0","open_weight":true},{"id":"qwen/qwen3-next-80b-a3b-thinking","name":"Qwen: Qwen3 Next 80B A3B Thinking","created_by":"qwen","source":"official","last_updated":"2026-05-17","family":"qwen3","description":"Qwen3-Next-80B-A3B-Thinking is a reasoning-first chat model in the Qwen3-Next line that outputs structured “thinking” traces by 
default.","context_window":262144,"max_output_tokens":32768,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"batch":true,"fine_tuning":true},"pricing":{"input":0.098,"output":0.78},"model_type":"chat","parameters":80,"active_parameters":3,"release_date":"2025-09-11","tagline":"Qwen3-Next-80B-A3B-Thinking is a reasoning-first chat model in the Qwen3-Next line that outputs structured “thinking” traces by default.","tools":["function_calling"],"license":"apache-2.0","open_weight":true},{"id":"qwen/qwen3-vl-235b-a22b-instruct","name":"Qwen: Qwen3 VL 235B A22B Instruct","created_by":"qwen","source":"official","last_updated":"2026-04-25","family":"qwen3","description":"Qwen3-VL-235B-A22B Instruct is an open-weight multimodal model that unifies strong text generation with visual understanding across images and video.","context_window":262144,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"vision":true,"reasoning":true,"fine_tuning":true},"pricing":{"input":0.2,"output":0.88,"cached_input":0.11},"model_type":"chat","parameters":235,"active_parameters":22,"release_date":"2025-09-23","tagline":"Qwen3-VL-235B-A22B Instruct is an open-weight multimodal model that unifies strong text generation with visual understanding across images and video.","tools":["function_calling"],"max_output_tokens":16384,"license":"apache-2.0","open_weight":true},{"id":"qwen/qwen3-vl-235b-a22b-thinking","name":"Qwen: Qwen3 VL 235B A22B Thinking","created_by":"qwen","source":"official","last_updated":"2026-03-24","family":"qwen3","description":"Qwen3-VL-235B-A22B Thinking is a multimodal model that unifies strong text generation with visual understanding across images and 
video.","context_window":131072,"max_output_tokens":32768,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"vision":true,"fine_tuning":true},"pricing":{"input":0.26,"output":2.6},"model_type":"chat","parameters":235,"active_parameters":22,"release_date":"2025-09-23","tagline":"Qwen3-VL-235B-A22B Thinking is a multimodal model that unifies strong text generation with visual understanding across images and video.","tools":["function_calling"],"license":"apache-2.0","open_weight":true},{"id":"qwen/qwen3-vl-30b-a3b-instruct","name":"Qwen: Qwen3 VL 30B A3B Instruct","created_by":"qwen","source":"official","last_updated":"2026-05-17","family":"qwen3","description":"Qwen3-VL-30B-A3B-Instruct is a multimodal model that unifies strong text generation with visual understanding for images and videos.","context_window":262144,"max_output_tokens":32768,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"vision":true,"reasoning":true,"fine_tuning":true},"pricing":{"input":0.13,"output":0.52},"model_type":"chat","parameters":30,"active_parameters":3,"release_date":"2025-10-06","tagline":"Qwen3-VL-30B-A3B-Instruct is a multimodal model that unifies strong text generation with visual understanding for images and videos.","tools":["function_calling"],"license":"apache-2.0","open_weight":true},{"id":"qwen/qwen3-vl-30b-a3b-thinking","name":"Qwen: Qwen3 VL 30B A3B Thinking","created_by":"qwen","source":"official","last_updated":"2026-03-24","family":"qwen3","description":"Qwen3-VL-30B-A3B-Thinking is a multimodal model that unifies strong text generation with visual understanding for images and 
videos.","context_window":131072,"max_output_tokens":32768,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"vision":true,"fine_tuning":true},"pricing":{"input":0.13,"output":1.56},"model_type":"chat","parameters":30,"active_parameters":3,"release_date":"2025-10-06","tagline":"Qwen3-VL-30B-A3B-Thinking is a multimodal model that unifies strong text generation with visual understanding for images and videos.","tools":["function_calling"],"license":"apache-2.0","open_weight":true},{"id":"qwen/qwen3-vl-32b-instruct","name":"Qwen: Qwen3 VL 32B Instruct","created_by":"qwen","source":"official","last_updated":"2026-05-17","family":"qwen3","description":"Qwen3-VL-32B-Instruct is a large-scale multimodal vision-language model designed for high-precision understanding and reasoning across text, images, and video.","context_window":262144,"max_output_tokens":32768,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"vision":true,"reasoning":true,"fine_tuning":true},"pricing":{"input":0.104,"output":0.416},"model_type":"chat","parameters":32,"release_date":"2025-10-23","tagline":"Qwen3-VL-32B-Instruct is a large-scale multimodal vision-language model designed for high-precision understanding and reasoning across text, images, and video.","tools":["function_calling"],"license":"apache-2.0","open_weight":true},{"id":"qwen/qwen3-vl-8b-instruct","name":"Qwen: Qwen3 VL 8B Instruct","created_by":"qwen","source":"official","last_updated":"2026-05-17","family":"qwen3","description":"Qwen3-VL-8B-Instruct is a multimodal vision-language model from the Qwen3-VL series, built for high-fidelity understanding and reasoning across text, images, and 
video.","context_window":256000,"max_output_tokens":32768,"modalities":{"input":["image","text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"vision":true,"reasoning":true,"fine_tuning":true},"pricing":{"input":0.08,"output":0.5},"model_type":"chat","parameters":8,"release_date":"2025-10-14","tagline":"Qwen3-VL-8B-Instruct is a multimodal vision-language model from the Qwen3-VL series, built for high-fidelity understanding and reasoning across text, images, and video.","tools":["function_calling"],"license":"apache-2.0","open_weight":true},{"id":"qwen/qwen3-vl-8b-thinking","name":"Qwen: Qwen3 VL 8B Thinking","created_by":"qwen","source":"official","last_updated":"2026-05-17","family":"qwen3","description":"Qwen3-VL-8B-Thinking is the reasoning-optimized variant of the Qwen3-VL-8B multimodal model, designed for advanced visual and textual reasoning across complex scenes, documents, and temporal sequences.","context_window":256000,"max_output_tokens":32768,"modalities":{"input":["image","text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"vision":true,"fine_tuning":true},"pricing":{"input":0.117,"output":1.365},"model_type":"chat","parameters":8,"release_date":"2025-10-14","tagline":"Qwen3-VL-8B-Thinking is the reasoning-optimized variant of the Qwen3-VL-8B multimodal model, designed for advanced visual and textual reasoning across complex scenes, documents, and temporal sequences","tools":["function_calling"],"license":"apache-2.0","open_weight":true},{"id":"qwen/qwen3.5-122b-a10b","name":"Qwen: Qwen3.5-122B-A10B","created_by":"qwen","source":"official","last_updated":"2026-05-23","family":"qwen3.5","description":"The Qwen3.5 122B-A10B native vision-language model is built on a hybrid architecture that integrates a linear attention mechanism with a sparse mixture-of-experts model, achieving higher inference 
efficiency.","context_window":262144,"max_output_tokens":262144,"modalities":{"input":["text","image","video"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"fine_tuning":true,"batch":true},"pricing":{"input":0.26,"output":2.08},"model_type":"chat","parameters":122,"active_parameters":10,"release_date":"2026-02-25","tagline":"The Qwen3.5 122B-A10B native vision-language model is built on a hybrid architecture that integrates a linear attention mechanism with a sparse mixture-of-experts model, achieving higher inference eff","tools":["function_calling"],"license":"apache-2.0","open_weight":true},{"id":"qwen/qwen3.5-27b","name":"Qwen: Qwen3.5-27B","created_by":"qwen","source":"official","last_updated":"2026-03-24","family":"qwen3.5","description":"The Qwen3.5 27B native vision-language Dense model incorporates a linear attention mechanism, delivering fast response times while balancing inference speed and performance.","context_window":262144,"max_output_tokens":65536,"modalities":{"input":["text","image","video"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"fine_tuning":true,"batch":true},"pricing":{"input":0.195,"output":1.56},"model_type":"chat","parameters":27,"release_date":"2026-02-25","tagline":"The Qwen3.5 27B native vision-language Dense model incorporates a linear attention mechanism, delivering fast response times while balancing inference speed and performance.","tools":["function_calling"],"license":"apache-2.0","open_weight":true},{"id":"qwen/qwen3.5-35b-a3b","name":"Qwen: Qwen3.5-35B-A3B","created_by":"qwen","source":"official","last_updated":"2026-06-29","family":"qwen3.5","description":"The Qwen3.5 Series 35B-A3B is a native vision-language model designed with a hybrid architecture that integrates linear attention mechanisms and a sparse mixture-of-experts model, achieving higher 
inference efficiency.","context_window":262144,"max_output_tokens":81920,"modalities":{"input":["text","image","video"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"fine_tuning":true,"batch":true},"pricing":{"input":0.14,"output":1,"cached_input":0.05},"model_type":"chat","parameters":35,"active_parameters":3,"release_date":"2026-02-25","tagline":"The Qwen3.5 Series 35B-A3B is a native vision-language model designed with a hybrid architecture that integrates linear attention mechanisms and a sparse mixture-of-experts model, achieving higher inf","tools":["function_calling"],"license":"apache-2.0","open_weight":true},{"id":"qwen/qwen3.5-397b-a17b","name":"Qwen: Qwen3.5 397B A17B","created_by":"qwen","source":"official","last_updated":"2026-06-18","family":"qwen3.5","description":"The Qwen3.5 series 397B-A17B native vision-language model is built on a hybrid architecture that integrates a linear attention mechanism with a sparse mixture-of-experts model, achieving higher inference efficiency.","context_window":256000,"max_output_tokens":65536,"modalities":{"input":["text","image","video"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"fine_tuning":true,"batch":true},"pricing":{"input":0.385,"output":2.45,"cached_input":0.195},"model_type":"chat","parameters":397,"active_parameters":17,"release_date":"2026-02-16","tagline":"The Qwen3.5 series 397B-A17B native vision-language model is built on a hybrid architecture that integrates a linear attention mechanism with a sparse mixture-of-experts model, achieving higher infere","tools":["function_calling"],"license":"apache-2.0","open_weight":true},{"id":"qwen/qwen3.5-9b","name":"Qwen: Qwen3.5-9B","created_by":"qwen","source":"official","last_updated":"2026-06-10","family":"qwen3.5","description":"Qwen3.5-9B is a multimodal foundation model from the Qwen3.5 
family, designed to deliver strong reasoning, coding, and visual understanding in an efficient 9B-parameter architecture.","context_window":262144,"modalities":{"input":["text","image","video"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":0.1,"output":0.15},"model_type":"chat","parameters":9,"release_date":"2026-03-10","tagline":"Qwen3.5-9B is a multimodal foundation model from the Qwen3.5 family, designed to deliver strong reasoning, coding, and visual understanding in an efficient 9B-parameter architecture.","tools":["function_calling"],"max_output_tokens":262144},{"id":"qwen/qwen3.5-flash-02-23","name":"Qwen: Qwen3.5-Flash","created_by":"qwen","source":"official","last_updated":"2026-03-24","family":"qwen3.5","description":"The Qwen3.5 native vision-language Flash models are built on a hybrid architecture that integrates a linear attention mechanism with a sparse mixture-of-experts model, achieving higher inference efficiency.","context_window":1000000,"max_output_tokens":65536,"modalities":{"input":["text","image","video"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":0.065,"output":0.26},"model_type":"chat","release_date":"2026-02-25","tagline":"The Qwen3.5 native vision-language Flash models are built on a hybrid architecture that integrates a linear attention mechanism with a sparse mixture-of-experts model, achieving higher inference effic","tools":["function_calling"]},{"id":"qwen/qwen3.5-plus-02-15","name":"Qwen: Qwen3.5 Plus 2026-02-15","created_by":"qwen","source":"official","last_updated":"2026-03-24","family":"qwen3.5","description":"The Qwen3.5 native vision-language series Plus models are built on a hybrid architecture that integrates linear attention mechanisms with sparse mixture-of-experts models, achieving higher inference 
efficiency.","context_window":1000000,"max_output_tokens":65536,"modalities":{"input":["text","image","video"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":0.26,"output":1.56},"model_type":"chat","release_date":"2026-02-16","tagline":"The Qwen3.5 native vision-language series Plus models are built on a hybrid architecture that integrates linear attention mechanisms with sparse mixture-of-experts models, achieving higher inference e","tools":["function_calling"]},{"id":"qwen/qwen3.5-plus-20260420","name":"Qwen: Qwen3.5 Plus 2026-04-20","created_by":"qwen","source":"official","family":"qwen3.5","description":"Qwen3.5 Plus (April 2026) is a large-scale multimodal language model from Alibaba.","release_date":"2026-04-27","context_window":1000000,"max_output_tokens":65536,"model_type":"chat","alias":"qwen/qwen3.5-plus","tagline":"Qwen3.5 Plus (April 2026) is a large-scale multimodal language model from Alibaba.","capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"modalities":{"input":["text","image","video"],"output":["text"]},"pricing":{"input":0.3,"output":1.8},"tools":["function_calling"],"last_updated":"2026-05-17"},{"id":"qwen/qwen3.5-plus","name":"Qwen: Qwen3.5 Plus 2026-04-20","created_by":"qwen","source":"official","family":"qwen3.5","description":"Qwen3.5 Plus (April 2026) is a large-scale multimodal language model from Alibaba.","release_date":"2026-04-27","context_window":1000000,"max_output_tokens":65536,"model_type":"chat","tagline":"Qwen3.5 Plus (April 2026) is a large-scale multimodal language model from 
Alibaba.","capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"batch":true},"modalities":{"input":["text","image","video"],"output":["text"]},"pricing":{"input":0.3,"output":1.8},"tools":["function_calling"],"snapshots":["qwen/qwen3.5-plus-20260420"],"last_updated":"2026-05-17","license":"proprietary","open_weight":false},{"id":"qwen/qwen3.6-27b","name":"Qwen: Qwen3.6 27B","created_by":"qwen","source":"official","family":"qwen3.6","description":"Qwen3.6 27B is a dense 27-billion-parameter language model from the Qwen Team at Alibaba, released in April 2026.","release_date":"2026-04-27","context_window":262144,"max_output_tokens":262140,"parameters":27,"model_type":"chat","tagline":"Qwen3.6 27B is a dense 27-billion-parameter language model from the Qwen Team at Alibaba, released in April 2026.","capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text","image","video"],"output":["text"]},"pricing":{"input":0.26,"output":2.385},"tools":["function_calling"],"last_updated":"2026-06-29","license":"apache-2.0","open_weight":true},{"id":"qwen/qwen3.6-35b-a3b","name":"Qwen: Qwen3.6 35B A3B","created_by":"qwen","source":"official","family":"qwen3.6","description":"Qwen3.6-35B-A3B is an open-weight multimodal model from Alibaba Cloud with 35 billion total parameters and 3 billion active parameters per token.","release_date":"2026-04-27","context_window":262144,"max_output_tokens":262144,"parameters":35,"active_parameters":3,"model_type":"chat","tagline":"Qwen3.6-35B-A3B is an open-weight multimodal model from Alibaba Cloud with 35 billion total parameters and 3 billion active parameters per 
token.","capabilities":{"structured_output":true,"reasoning":true,"json_mode":true,"tool_call":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text","image","video"],"output":["text"]},"pricing":{"input":0.14,"output":1,"cached_input":0.05},"last_updated":"2026-06-20","tools":["function_calling"],"license":"apache-2.0","open_weight":true},{"id":"qwen/qwen3.6-flash","name":"Qwen: Qwen3.6 Flash","created_by":"qwen","source":"official","family":"qwen3.6","description":"Qwen3.6 Flash is a fast, efficient language model from Alibaba's Qwen 3.6 series.","release_date":"2026-04-27","context_window":1000000,"max_output_tokens":65536,"model_type":"chat","tagline":"Qwen3.6 Flash is a fast, efficient language model from Alibaba's Qwen 3.6 series.","capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"fine_tuning":true,"batch":true},"modalities":{"input":["text","image","video"],"output":["text"]},"pricing":{"input":0.188,"output":1.125},"tools":["function_calling"],"last_updated":"2026-05-17","license":"apache-2.0","open_weight":true},{"id":"qwen/qwen3.6-max-preview","name":"Qwen: Qwen3.6 Max Preview","created_by":"qwen","source":"official","family":"qwen3.6","description":"Qwen3.6-Max-Preview is a proprietary frontier model from Alibaba Cloud built on a sparse mixture-of-experts architecture with approximately 1 trillion total parameters.","release_date":"2026-04-27","context_window":262144,"max_output_tokens":65536,"model_type":"chat","tagline":"Qwen3.6-Max-Preview is a proprietary frontier model from Alibaba Cloud built on a sparse mixture-of-experts architecture with approximately 1 trillion total 
parameters.","capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"fine_tuning":true,"batch":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":1.04,"output":6.24},"tools":["function_calling"],"last_updated":"2026-05-01","license":"apache-2.0","open_weight":true},{"id":"qwen/qwen3.6-plus:free","name":"Qwen: Qwen3.6 Plus (free)","created_by":"qwen","source":"official","family":"qwen3.6","description":"Qwen 3.6 Plus builds on a hybrid architecture that combines efficient linear attention with sparse mixture-of-experts routing, enabling strong scalability and high-performance inference.","release_date":"2026-04-02","context_window":1000000,"max_output_tokens":65536,"model_type":"chat","tagline":"Qwen 3.6 Plus builds on a hybrid architecture that combines efficient linear attention with sparse mixture-of-experts routing, enabling strong scalability and high-performance inference.","capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"modalities":{"input":["text","image","video"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-04-03"},{"id":"qwen/qwen3.6-plus-preview:free","name":"Qwen: Qwen3.6 Plus Preview (free)","created_by":"qwen","source":"official","family":"qwen3.6","description":"Qwen 3.6 Plus Preview is the next-generation evolution of the Qwen Plus series, featuring an advanced hybrid architecture that improves efficiency and scalability.","release_date":"2026-03-30","context_window":1000000,"max_output_tokens":32000,"model_type":"chat","tagline":"Qwen 3.6 Plus Preview is the next-generation evolution of the Qwen Plus series, featuring an advanced hybrid architecture that improves efficiency and 
scalability.","capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-04-01"},{"id":"qwen/qwen3.6-plus","name":"Qwen: Qwen3.6 Plus","created_by":"qwen","source":"official","family":"qwen3.6","description":"Qwen 3.6 Plus builds on a hybrid architecture that combines efficient linear attention with sparse mixture-of-experts routing, enabling strong scalability and high-performance inference.","release_date":"2026-04-02","context_window":1000000,"max_output_tokens":65536,"model_type":"chat","tagline":"Qwen 3.6 Plus builds on a hybrid architecture that combines efficient linear attention with sparse mixture-of-experts routing, enabling strong scalability and high-performance inference.","capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"fine_tuning":true,"batch":true},"modalities":{"input":["text","image","video"],"output":["text"]},"pricing":{"input":0.325,"output":1.95},"tools":["function_calling"],"last_updated":"2026-04-08","license":"apache-2.0","open_weight":true},{"id":"qwen/qwen3.7-max","name":"Qwen: Qwen3.7 Max","created_by":"qwen","source":"official","family":"qwen3.7","description":"Qwen3.7-Max is the flagship model in Alibaba's Qwen3.7 series.","release_date":"2026-05-21","context_window":1000000,"max_output_tokens":65536,"model_type":"chat","tagline":"Qwen3.7-Max is the flagship model in Alibaba's Qwen3.7 series.","capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"batch":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":1.25,"output":3.75,"cached_input":0.25},"tools":["function_calling"],"last_updated":"2026-05-29","license":"apache-2.0","open_weight":true},{"id":"qwen/qwen3.7-plus","name":"Qwen: Qwen3.7 
Plus","created_by":"qwen","source":"official","family":"qwen3.7","description":"Qwen3.7-Plus is a cost-effective model in Alibaba's Qwen3.7 series.","release_date":"2026-06-03","context_window":1000000,"max_output_tokens":65536,"model_type":"chat","tagline":"Qwen3.7-Plus is a cost-effective model in Alibaba's Qwen3.7 series.","capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"batch":true,"fine_tuning":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":0.32,"output":1.28,"cached_input":0.064},"tools":["function_calling"],"last_updated":"2026-06-18","license":"apache-2.0","open_weight":true},{"id":"qwen/qwq-32b","name":"Qwen: QwQ 32B","created_by":"qwen","source":"official","last_updated":"2026-04-22","family":"qwq","description":"QwQ is the reasoning model of the Qwen series.","context_window":131072,"max_output_tokens":131072,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"reasoning":true,"streaming":true,"fine_tuning":true},"pricing":{"input":0.15,"output":0.58},"model_type":"chat","parameters":32,"release_date":"2025-03-05","tagline":"QwQ is the reasoning model of the Qwen series.","tools":["function_calling"],"status":"deprecated","deprecation_date":"2026-04-29","license":"apache-2.0","open_weight":true},{"id":"reka/reka-edge","name":"Reka Edge","created_by":"reka","source":"official","description":"Reka Edge is an extremely efficient 7B multimodal vision-language model that accepts image/video+text inputs and generates text outputs.","release_date":"2026-03-20","context_window":16384,"max_output_tokens":16384,"tagline":"Reka Edge is an extremely efficient 7B multimodal vision-language model that accepts image/video+text inputs and generates text 
outputs.","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"vision":true,"streaming":true},"modalities":{"input":["image","text","video"],"output":["text"]},"pricing":{"input":0.1,"output":0.1},"tools":["function_calling"],"last_updated":"2026-03-27","license":"proprietary","open_weight":false},{"id":"rekaai/reka-edge","name":"Reka Edge","created_by":"rekaai","source":"official","description":"Reka Edge is an extremely efficient 7B multimodal vision-language model that accepts image/video+text inputs and generates text outputs.","release_date":"2026-03-20","context_window":16384,"max_output_tokens":16384,"tagline":"Reka Edge is an extremely efficient 7B multimodal vision-language model that accepts image/video+text inputs and generates text outputs.","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true},"modalities":{"input":["image","text","video"],"output":["text"]},"pricing":{"input":0.1,"output":0.1},"tools":["function_calling"],"last_updated":"2026-04-03"},{"id":"rekaai/reka-flash-3","name":"Reka Flash 3","created_by":"rekaai","source":"official","description":"Reka Flash 3 is a general-purpose, instruction-tuned large language model with 21 billion parameters, developed by Reka.","release_date":"2025-03-12","context_window":65536,"max_output_tokens":65536,"tagline":"Reka Flash 3 is a general-purpose, instruction-tuned large language model with 21 billion parameters, developed by Reka.","capabilities":{"reasoning":true,"structured_output":true,"json_mode":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.1,"output":0.2},"last_updated":"2026-06-20"},{"id":"relace/relace-apply-3","name":"Relace: Relace Apply 3","created_by":"relace","source":"official","last_updated":"2026-03-23","description":"Relace Apply 3 is a specialized code-patching LLM that merges AI-suggested edits straight into your source 
files.","context_window":256000,"max_output_tokens":128000,"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.85,"output":1.25},"release_date":"2025-09-26","tagline":"Relace Apply 3 is a specialized code-patching LLM that merges AI-suggested edits straight into your source files."},{"id":"relace/relace-search","name":"Relace: Relace Search","created_by":"relace","source":"official","last_updated":"2026-06-20","description":"The relace-search model uses 4-12 `view_file` and `grep` tools in parallel to explore a codebase and return relevant files to the user request.","context_window":256000,"max_output_tokens":128000,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true},"pricing":{"input":1,"output":3},"model_type":"chat","release_date":"2025-12-08","tagline":"The relace-search model uses 4-12 `view_file` and `grep` tools in parallel to explore a codebase and return relevant files to the user request.","tools":["function_calling"]},{"id":"sakana/fugu-ultra","name":"Sakana: Fugu Ultra","created_by":"sakana","source":"official","description":"Fugu Ultra is the higher-performance model in Sakana AI's Fugu family.","release_date":"2026-06-24","context_window":1000000,"max_output_tokens":128000,"tagline":"Fugu Ultra is the higher-performance model in Sakana AI's Fugu family.","capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":5,"output":30,"cached_input":0.5},"tools":["function_calling"],"last_updated":"2026-06-29"},{"id":"sao10k/l3-euryale-70b","name":"Sao10k: Llama 3 Euryale 70B v2.1","created_by":"sao10k","source":"official","last_updated":"2026-05-29","description":"Euryale 70B v2.1 is a model focused on creative roleplay from 
[Sao10k](https://ko-fi.com/sao10k).","context_window":8192,"max_output_tokens":8192,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true},"pricing":{"input":1.48,"output":1.48},"parameters":70,"release_date":"2024-06-18","tagline":"Euryale 70B v2.1 is a model focused on creative roleplay from [Sao10k](https://ko-fi.com/sao10k).","tools":["function_calling"],"status":"deprecated","deprecation_date":"2026-06-05"},{"id":"sao10k/l3-lunaris-8b","name":"Sao10K: Llama 3 8B Lunaris","created_by":"sao10k","source":"official","last_updated":"2026-04-25","description":"Lunaris 8B is a versatile generalist and roleplaying model based on Llama 3.","context_window":8192,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"structured_output":true,"json_mode":true},"pricing":{"input":0.04,"output":0.05},"parameters":8,"release_date":"2024-08-13","tagline":"Lunaris 8B is a versatile generalist and roleplaying model based on Llama 3.","max_output_tokens":16384},{"id":"sao10k/l3.1-70b-hanami-x1","name":"Sao10K: Llama 3.1 70B Hanami x1","created_by":"sao10k","source":"official","last_updated":"2026-06-20","description":"This is [Sao10K](/sao10k)'s experiment over [Euryale v2.2](/sao10k/l3.1-euryale-70b).","context_window":16000,"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":3,"output":3},"parameters":70,"release_date":"2025-01-08","tagline":"This is [Sao10K](/sao10k)'s experiment over [Euryale v2.2](/sao10k/l3.1-euryale-70b).","capabilities":{"structured_output":true,"json_mode":true}},{"id":"sao10k/l3.1-euryale-70b","name":"Sao10K: Llama 3.1 Euryale 70B v2.2","created_by":"sao10k","source":"official","last_updated":"2026-03-24","description":"Euryale L3.1 70B v2.2 is a model focused on creative roleplay from 
[Sao10k](https://ko-fi.com/sao10k).","context_window":131072,"max_output_tokens":16384,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true},"pricing":{"input":0.85,"output":0.85},"parameters":70,"release_date":"2024-08-28","tagline":"Euryale L3.1 70B v2.2 is a model focused on creative roleplay from [Sao10k](https://ko-fi.com/sao10k).","tools":["function_calling"]},{"id":"sao10k/l3.3-euryale-70b","name":"Sao10K: Llama 3.3 Euryale 70B","created_by":"sao10k","source":"official","last_updated":"2026-03-24","description":"Euryale L3.3 70B is a model focused on creative roleplay from [Sao10k](https://ko-fi.com/sao10k).","context_window":131072,"max_output_tokens":16384,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"structured_output":true,"json_mode":true},"pricing":{"input":0.65,"output":0.75},"parameters":70,"release_date":"2024-12-18","tagline":"Euryale L3.3 70B is a model focused on creative roleplay from [Sao10k](https://ko-fi.com/sao10k)."},{"id":"stepfun/step-3.5-flash:free","name":"StepFun: Step 3.5 Flash (free)","created_by":"stepfun","source":"official","last_updated":"2026-03-23","description":"Step 3.5 Flash is StepFun's most capable open-source foundation model.","context_window":256000,"max_output_tokens":256000,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"reasoning":true},"release_date":"2026-01-29","tagline":"Step 3.5 Flash is StepFun's most capable open-source foundation model.","tools":["function_calling"]},{"id":"stepfun/step-3.5-flash","name":"StepFun: Step 3.5 Flash","created_by":"stepfun","source":"official","last_updated":"2026-06-29","description":"Step 3.5 Flash is StepFun's most capable open-source foundation 
model.","context_window":262144,"max_output_tokens":16384,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"reasoning":true,"structured_output":true,"json_mode":true,"streaming":true,"fine_tuning":true},"pricing":{"input":0.09,"output":0.3,"cached_input":0.02},"release_date":"2026-01-29","tagline":"Step 3.5 Flash is StepFun's most capable open-source foundation model.","tools":["function_calling"],"status":"deprecated","deprecation_date":"2026-06-29","license":"apache-2.0","open_weight":true},{"id":"stepfun/step-3.7-flash","name":"StepFun: Step 3.7 Flash","created_by":"stepfun","source":"official","description":"Step 3.7 Flash is StepFun's latest high-efficiency multimodal Mixture-of-Experts model.","release_date":"2026-05-28","context_window":256000,"max_output_tokens":256000,"tagline":"Step 3.7 Flash is StepFun's latest high-efficiency multimodal Mixture-of-Experts model.","capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"modalities":{"input":["text","image","video"],"output":["text"]},"pricing":{"input":0.2,"output":1.15,"cached_input":0.04},"tools":["function_calling"],"last_updated":"2026-06-02"},{"id":"switchpoint/router","name":"Switchpoint Router","created_by":"switchpoint","source":"official","last_updated":"2026-06-20","description":"Switchpoint AI's router instantly analyzes your request and directs it to the optimal AI from an ever-evolving library.","context_window":131072,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"reasoning":true,"structured_output":true,"json_mode":true},"pricing":{"input":0.85,"output":3.4},"release_date":"2025-07-11","tagline":"Switchpoint AI's router instantly analyzes your request and directs it to the optimal AI from an ever-evolving library."},{"id":"tencent/hunyuan-a13b-instruct","name":"Tencent: Hunyuan A13B Instruct","created_by":"tencent","source":"official","last_updated":"2026-03-24","description":"Hunyuan-A13B is a 13B 
active parameter Mixture-of-Experts (MoE) language model developed by Tencent, with a total parameter count of 80B and support for reasoning via Chain-of-Thought.","context_window":131072,"max_output_tokens":131072,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":0.14,"output":0.57},"release_date":"2025-07-08","tagline":"Hunyuan-A13B is a 13B active parameter Mixture-of-Experts (MoE) language model developed by Tencent, with a total parameter count of 80B and support for reasoning via Chain-of-Thought."},{"id":"tencent/hy3-preview:free","name":"Tencent: Hy3 preview (free)","created_by":"tencent","source":"official","description":"Hy3 preview is a high-efficiency Mixture-of-Experts model from Tencent designed for agentic workflows and production use.","release_date":"2026-04-22","context_window":262144,"max_output_tokens":262144,"tagline":"Hy3 preview is a high-efficiency Mixture-of-Experts model from Tencent designed for agentic workflows and production use.","capabilities":{"tool_call":true,"reasoning":true},"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-04-25","status":"deprecated","deprecation_date":"2026-05-08"},{"id":"tencent/hy3-preview","name":"Tencent: Hy3 preview","created_by":"tencent","source":"official","description":"Hy3 preview is a high-efficiency Mixture-of-Experts model from Tencent designed for agentic workflows and production use.","release_date":"2026-04-22","context_window":262144,"max_output_tokens":262144,"tagline":"Hy3 preview is a high-efficiency Mixture-of-Experts model from Tencent designed for agentic workflows and production 
use.","capabilities":{"tool_call":true,"reasoning":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.063,"output":0.21,"cached_input":0.021},"tools":["function_calling"],"last_updated":"2026-06-20"},{"id":"thedrummer/cydonia-24b-v4.1","name":"TheDrummer: Cydonia 24B V4.1","created_by":"thedrummer","source":"official","last_updated":"2026-06-18","description":"Uncensored and creative writing model based on Mistral Small 3.2 24B with good recall, prompt adherence, and intelligence.","context_window":131072,"max_output_tokens":131072,"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.3,"output":0.5,"cached_input":0.15},"parameters":24,"release_date":"2025-09-27","tagline":"Uncensored and creative writing model based on Mistral Small 3.2 24B with good recall, prompt adherence, and intelligence.","capabilities":{"structured_output":true,"json_mode":true}},{"id":"thedrummer/rocinante-12b","name":"TheDrummer: Rocinante 12B","created_by":"thedrummer","source":"official","last_updated":"2026-06-29","description":"Rocinante 12B is designed for engaging storytelling and rich prose.","context_window":32768,"max_output_tokens":32768,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true},"pricing":{"input":0.25,"output":0.5},"parameters":12,"release_date":"2024-09-30","tagline":"Rocinante 12B is designed for engaging storytelling and rich prose.","tools":["function_calling"]},{"id":"thedrummer/skyfall-36b-v2","name":"TheDrummer: Skyfall 36B V2","created_by":"thedrummer","source":"official","last_updated":"2026-06-20","description":"Skyfall 36B v2 is an enhanced iteration of Mistral Small 2501, specifically fine-tuned for improved creativity, nuanced writing, role-playing, and coherent 
storytelling.","context_window":32768,"max_output_tokens":32768,"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.55,"output":0.8,"cached_input":0.25},"parameters":36,"release_date":"2025-03-10","tagline":"Skyfall 36B v2 is an enhanced iteration of Mistral Small 2501, specifically fine-tuned for improved creativity, nuanced writing, role-playing, and coherent storytelling.","capabilities":{"structured_output":true,"json_mode":true}},{"id":"thedrummer/unslopnemo-12b","name":"TheDrummer: UnslopNemo 12B","created_by":"thedrummer","source":"official","last_updated":"2026-03-24","description":"UnslopNemo v4.1 is the latest addition from the creator of Rocinante, designed for adventure writing and role-play scenarios.","context_window":32768,"max_output_tokens":32768,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true},"pricing":{"input":0.4,"output":0.4},"parameters":12,"release_date":"2024-11-08","tagline":"UnslopNemo v4.1 is the latest addition from the creator of Rocinante, designed for adventure writing and role-play scenarios.","tools":["function_calling"]},{"id":"tngtech/deepseek-r1t2-chimera","name":"TNG: DeepSeek R1T2 Chimera","created_by":"tngtech","source":"official","last_updated":"2026-03-24","family":"deepseek-r1","description":"DeepSeek-TNG-R1T2-Chimera is the second-generation Chimera model from TNG Tech.","context_window":163840,"max_output_tokens":163840,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":0.3,"output":1.1,"cached_input":0.15},"model_type":"reasoning","release_date":"2025-07-08","tagline":"DeepSeek-TNG-R1T2-Chimera is the second-generation Chimera model from TNG Tech.","tools":["function_calling"]},{"id":"undi95/remm-slerp-l2-13b","name":"ReMM SLERP 
13B","created_by":"undi95","source":"official","last_updated":"2026-03-24","description":"A recreation trial of the original MythoMax-L2-B13 but with updated models.","context_window":6144,"max_output_tokens":4096,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"structured_output":true,"json_mode":true},"pricing":{"input":0.45,"output":0.65},"parameters":13,"release_date":"2023-07-22","tagline":"A recreation trial of the original MythoMax-L2-B13 but with updated models."},{"id":"upstage/solar-pro-3","name":"Upstage: Solar Pro 3","created_by":"upstage","source":"official","last_updated":"2026-03-24","description":"Solar Pro 3 is Upstage's powerful Mixture-of-Experts (MoE) language model.","context_window":128000,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":0.15,"output":0.6,"cached_input":0.015},"release_date":"2026-01-27","tagline":"Solar Pro 3 is Upstage's powerful Mixture-of-Experts (MoE) language model.","tools":["function_calling"]},{"id":"writer/palmyra-x5","name":"Writer: Palmyra X5","created_by":"writer","source":"official","last_updated":"2026-03-23","description":"Palmyra X5 is Writer's most advanced model, purpose-built for building and scaling AI agents across the enterprise.","context_window":1040000,"max_output_tokens":8192,"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.6,"output":6},"model_type":"chat","release_date":"2026-01-21","tagline":"Palmyra X5 is Writer's most advanced model, purpose-built for building and scaling AI agents across the enterprise.","license":"proprietary","open_weight":false,"capabilities":{"vision":true,"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true}},{"id":"x-ai/grok-3-beta","name":"xAI: Grok 3 Beta","created_by":"xai","source":"official","last_updated":"2026-05-07","family":"grok-3","description":"Grok 3 is the latest model from 
xAI.","context_window":131072,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true},"pricing":{"input":3,"output":15,"cached_input":0.75},"model_type":"chat","release_date":"2025-04-09","tagline":"Grok 3 is the latest model from xAI.","tools":["function_calling"],"status":"deprecated","deprecation_date":"2026-05-15"},{"id":"x-ai/grok-3-mini-beta","name":"xAI: Grok 3 Mini Beta","created_by":"xai","source":"official","last_updated":"2026-05-07","family":"grok-3","description":"Grok 3 Mini is a lightweight, smaller thinking model.","context_window":131072,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":0.3,"output":0.5,"cached_input":0.075},"model_type":"chat","release_date":"2025-04-09","tagline":"Grok 3 Mini is a lightweight, smaller thinking model.","tools":["function_calling"],"status":"deprecated","deprecation_date":"2026-05-15"},{"id":"x-ai/grok-3-mini","name":"xAI: Grok 3 Mini","created_by":"xai","source":"official","last_updated":"2026-05-07","family":"grok-3","description":"A lightweight model that thinks before responding.","context_window":131072,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"batch":true},"pricing":{"input":0.3,"output":0.5,"cached_input":0.075},"model_type":"chat","release_date":"2025-06-10","tagline":"A lightweight model that thinks before responding.","tools":["function_calling"],"status":"deprecated","deprecation_date":"2026-05-15","knowledge_cutoff":"2024-11","license":"proprietary","open_weight":false},{"id":"x-ai/grok-3","name":"xAI: Grok 3","created_by":"xai","source":"official","last_updated":"2026-05-07","family":"grok-3","description":"Grok 3 is the latest model from 
xAI.","context_window":131072,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"batch":true},"pricing":{"input":3,"output":15,"cached_input":0.75},"model_type":"chat","release_date":"2025-06-10","tagline":"Grok 3 is the latest model from xAI.","tools":["function_calling"],"status":"deprecated","deprecation_date":"2026-05-15","knowledge_cutoff":"2024-11","license":"proprietary","open_weight":false},{"id":"x-ai/grok-4-fast","name":"xAI: Grok 4 Fast","created_by":"xai","source":"official","last_updated":"2026-05-07","family":"grok-4","description":"Grok 4 Fast is xAI's latest multimodal model with SOTA cost-efficiency and a 2M token context window.","context_window":2000000,"max_output_tokens":30000,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":0.2,"output":0.5,"cached_input":0.05},"model_type":"chat","release_date":"2025-09-19","tagline":"Grok 4 Fast is xAI's latest multimodal model with SOTA cost-efficiency and a 2M token context window.","tools":["function_calling"],"status":"deprecated","deprecation_date":"2026-05-15"},{"id":"x-ai/grok-4.1-fast","name":"xAI: Grok 4.1 Fast","created_by":"xai","source":"official","last_updated":"2026-05-07","family":"grok-4.1","description":"Grok 4.1 Fast is xAI's best agentic tool calling model that shines in real-world use cases like customer support and deep research.","context_window":2000000,"max_output_tokens":30000,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":0.2,"output":0.5,"cached_input":0.05},"model_type":"chat","release_date":"2025-11-19","tagline":"Grok 4.1 Fast is xAI's best agentic tool calling model that shines in real-world use cases like customer support and deep 
research.","tools":["function_calling"],"status":"deprecated","deprecation_date":"2026-05-15"},{"id":"x-ai/grok-4.20-beta","name":"xAI: Grok 4.20 Beta","created_by":"xai","source":"official","last_updated":"2026-03-24","family":"grok-4.20","description":"Grok 4.20 Beta is xAI's newest flagship model with industry-leading speed and agentic tool calling capabilities.","context_window":2000000,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":2,"output":6,"cached_input":0.2},"model_type":"chat","release_date":"2026-03-12","tagline":"Grok 4.20 Beta is xAI's newest flagship model with industry-leading speed and agentic tool calling capabilities.","tools":["function_calling"]},{"id":"x-ai/grok-4.20-multi-agent-beta","name":"xAI: Grok 4.20 Multi-Agent Beta","created_by":"xai","source":"official","last_updated":"2026-03-24","family":"grok-4.20","description":"Grok 4.20 Multi-Agent Beta is a variant of xAI’s Grok 4.20 designed for collaborative, agent-based workflows.","context_window":2000000,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":2,"output":6,"cached_input":0.2},"model_type":"chat","release_date":"2026-03-12","tagline":"Grok 4.20 Multi-Agent Beta is a variant of xAI’s Grok 4.20 designed for collaborative, agent-based workflows."},{"id":"x-ai/grok-4.20-multi-agent","name":"xAI: Grok 4.20 Multi-Agent","created_by":"xai","source":"official","family":"grok-4.20","description":"Grok 4.20 Multi-Agent is a variant of xAI’s Grok 4.20 designed for collaborative, agent-based workflows.","release_date":"2026-03-31","context_window":2000000,"model_type":"chat","tagline":"Grok 4.20 Multi-Agent is a variant of xAI’s Grok 4.20 designed for collaborative, agent-based 
workflows.","capabilities":{"structured_output":true,"reasoning":true,"json_mode":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":1.25,"output":2.5,"cached_input":0.2},"last_updated":"2026-06-18"},{"id":"x-ai/grok-4.20","name":"xAI: Grok 4.20","created_by":"xai","source":"official","family":"grok-4.20","description":"Grok 4.20 is a reasoning model from xAI with industry-leading speed and agentic tool calling capabilities.","release_date":"2026-03-31","context_window":2000000,"model_type":"chat","tagline":"Grok 4.20 is xAI's newest flagship model with industry-leading speed and agentic tool calling capabilities.","capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":1.25,"output":2.5,"cached_input":0.2},"tools":["function_calling"],"last_updated":"2026-05-10"},{"id":"x-ai/grok-4.3","name":"xAI: Grok 4.3","created_by":"xai","source":"official","family":"grok-4.3","description":"Grok 4.3 is a reasoning model from xAI.","release_date":"2026-04-30","context_window":1000000,"model_type":"chat","tagline":"Grok 4.3 is a reasoning model from xAI.","capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"batch":true,"vision":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":1.25,"output":2.5,"cached_input":0.2},"tools":["function_calling"],"last_updated":"2026-05-01","knowledge_cutoff":"2024-11","license":"proprietary","open_weight":false},{"id":"x-ai/grok-4","name":"xAI: Grok 4","created_by":"xai","source":"official","last_updated":"2026-05-07","family":"grok-4","description":"Grok 4 is xAI's latest reasoning model with a 256k context 
window.","context_window":256000,"modalities":{"input":["image","text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":3,"output":15,"cached_input":0.75},"model_type":"chat","release_date":"2025-07-09","tagline":"Grok 4 is xAI's latest reasoning model with a 256k context window.","tools":["function_calling"],"status":"deprecated","deprecation_date":"2026-05-15"},{"id":"x-ai/grok-build-0.1","name":"xAI: Grok Build 0.1","created_by":"xai","source":"official","description":"Grok Build 0.1 is xAI’s fast coding model trained specifically for agentic software engineering workflows.","release_date":"2026-05-20","context_window":256000,"model_type":"chat","tagline":"Grok Build 0.1 is xAI’s fast coding model trained specifically for agentic software engineering workflows.","capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"batch":true,"vision":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":1,"output":2,"cached_input":0.2},"tools":["function_calling"],"last_updated":"2026-05-23","license":"proprietary","open_weight":false},{"id":"x-ai/grok-code-fast-1","name":"xAI: Grok Code Fast 1","created_by":"xai","source":"official","last_updated":"2026-05-07","family":"grok-code","description":"Grok Code Fast 1 is a speedy and economical reasoning model that excels at agentic coding.","context_window":256000,"max_output_tokens":10000,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"batch":true},"pricing":{"input":0.2,"output":1.5,"cached_input":0.02},"model_type":"code","release_date":"2025-08-26","tagline":"Grok Code Fast 1 is a speedy and economical reasoning model that excels at agentic 
coding.","tools":["function_calling"],"status":"deprecated","deprecation_date":"2026-05-15","license":"proprietary","open_weight":false},{"id":"xiaomi/mimo-v2-flash","name":"Xiaomi: MiMo-V2-Flash","created_by":"xiaomi","source":"official","last_updated":"2026-05-10","description":"MiMo-V2-Flash is an open-source foundation language model developed by Xiaomi.","context_window":262144,"max_output_tokens":65536,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"fine_tuning":true},"pricing":{"input":0.1,"output":0.3,"cached_input":0.01},"release_date":"2025-12-14","tagline":"MiMo-V2-Flash is an open-source foundation language model developed by Xiaomi.","tools":["function_calling"],"family":"mimo","model_type":"chat","knowledge_cutoff":"2024-12","license":"mit","parameters":309,"active_parameters":15,"architecture":"moe","open_weight":true},{"id":"xiaomi/mimo-v2-omni","name":"Xiaomi: MiMo-V2-Omni","created_by":"xiaomi","source":"official","last_updated":"2026-05-29","description":"MiMo-V2-Omni is a frontier omni-modal model that natively processes image, video, and audio inputs within a unified architecture.","context_window":262144,"max_output_tokens":65536,"modalities":{"input":["text","audio","image","video"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"vision":true},"pricing":{"input":0.4,"output":2,"cached_input":0.08},"release_date":"2026-03-18","tagline":"MiMo-V2-Omni is a frontier omni-modal model that natively processes image, video, and audio inputs within a unified architecture.","tools":["function_calling"],"family":"mimo","model_type":"chat","status":"deprecated","deprecation_date":"2026-05-31","license":"proprietary","open_weight":false},{"id":"xiaomi/mimo-v2-pro","name":"Xiaomi: 
MiMo-V2-Pro","created_by":"xiaomi","source":"official","last_updated":"2026-05-29","description":"MiMo-V2-Pro is Xiaomi's flagship foundation model, featuring over 1T total parameters and a 1M context length, deeply optimized for agentic scenarios.","context_window":1048576,"max_output_tokens":131072,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true},"pricing":{"input":1,"output":3,"cached_input":0.2},"release_date":"2026-03-18","tagline":"MiMo-V2-Pro is Xiaomi's flagship foundation model, featuring over 1T total parameters and a 1M context length, deeply optimized for agentic scenarios.","tools":["function_calling"],"family":"mimo","model_type":"chat","status":"deprecated","deprecation_date":"2026-05-31","license":"proprietary","parameters":1000,"active_parameters":42,"architecture":"moe","open_weight":false},{"id":"xiaomi/mimo-v2.5-pro","name":"Xiaomi: MiMo-V2.5-Pro","created_by":"xiaomi","source":"official","family":"mimo","description":"MiMo-V2.5-Pro is Xiaomi’s flagship model, delivering strong performance in general agentic capabilities, complex software engineering, and long-horizon tasks, with top rankings on benchmarks such as C","release_date":"2026-04-22","context_window":1048576,"max_output_tokens":131072,"model_type":"chat","tagline":"MiMo-V2.5-Pro is Xiaomi’s flagship model, delivering strong performance in general agentic capabilities, complex software engineering, and long-horizon tasks, with top rankings on benchmarks such as C","capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.435,"output":0.87,"cached_input":0.004},"tools":["function_calling"],"last_updated":"2026-05-29"},{"id":"xiaomi/mimo-v2.5","name":"Xiaomi: MiMo-V2.5","created_by":"xiaomi","source":"official","family":"mimo","description":"MiMo-V2.5 is a 
native omnimodal model by Xiaomi.","release_date":"2026-04-22","context_window":1048576,"max_output_tokens":131072,"model_type":"chat","tagline":"MiMo-V2.5 is a native omnimodal model by Xiaomi.","capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"vision":true},"modalities":{"input":["text","audio","image","video"],"output":["text"]},"pricing":{"input":0.105,"output":0.28,"cached_input":0.003},"tools":["function_calling"],"last_updated":"2026-06-29"},{"id":"z-ai/glm-4-32b","name":"Z.ai: GLM 4 32B ","created_by":"z-ai","source":"official","last_updated":"2026-03-23","description":"GLM 4 32B is a cost-effective foundation language model.","context_window":128000,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true},"pricing":{"input":0.1,"output":0.1},"family":"glm-4","model_type":"chat","parameters":32,"release_date":"2025-07-24","tagline":"GLM 4 32B is a cost-effective foundation language model.","tools":["function_calling"]},{"id":"z-ai/glm-4.5-air:free","name":"Z.ai: GLM 4.5 Air (free)","created_by":"z-ai","source":"official","last_updated":"2026-03-23","description":"GLM-4.5-Air is the lightweight variant of our latest flagship model family, also purpose-built for agent-centric applications.","context_window":131072,"max_output_tokens":96000,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"reasoning":true},"family":"glm-4.5","model_type":"chat","release_date":"2025-07-25","tagline":"GLM-4.5-Air is the lightweight variant of our latest flagship model family, also purpose-built for agent-centric applications.","tools":["function_calling"]},{"id":"z-ai/glm-4.5-air","name":"Z.ai: GLM 4.5 Air","created_by":"z-ai","source":"official","last_updated":"2026-06-18","description":"GLM-4.5-Air is the lightweight variant of our latest flagship model family, also purpose-built for agent-centric 
applications.","context_window":131072,"max_output_tokens":98304,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":0.13,"output":0.85,"cached_input":0.025},"family":"glm-4.5","model_type":"chat","release_date":"2025-07-25","tagline":"GLM-4.5-Air is the lightweight variant of our latest flagship model family, also purpose-built for agent-centric applications.","tools":["function_calling"]},{"id":"z-ai/glm-4.5","name":"Z.ai: GLM 4.5","created_by":"z-ai","source":"official","last_updated":"2026-06-20","description":"GLM-4.5 is our latest flagship foundation model, purpose-built for agent-based applications.","context_window":131072,"max_output_tokens":98304,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":0.6,"output":2.2,"cached_input":0.11},"family":"glm-4.5","model_type":"chat","release_date":"2025-07-25","tagline":"GLM-4.5 is our latest flagship foundation model, purpose-built for agent-based applications.","tools":["function_calling"],"status":"deprecated","deprecation_date":"2026-12-31"},{"id":"z-ai/glm-4.5v","name":"Z.ai: GLM 4.5V","created_by":"z-ai","source":"official","last_updated":"2026-03-24","description":"GLM-4.5V is a vision-language foundation model for multimodal agent applications.","context_window":65536,"max_output_tokens":16384,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":0.6,"output":1.8,"cached_input":0.11},"family":"glm-4.5","model_type":"chat","release_date":"2025-08-11","tagline":"GLM-4.5V is a vision-language foundation model for multimodal agent applications.","tools":["function_calling"]},{"id":"z-ai/glm-4.6","name":"Z.ai: GLM 
4.6","created_by":"z-ai","source":"official","last_updated":"2026-05-14","description":"Compared with GLM-4.5, this generation brings several key improvements: Longer context window: The context window has been expanded from 128K to 200K tokens, enabling the model to handle more complex.","context_window":202752,"max_output_tokens":131072,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":0.43,"output":1.74,"cached_input":0.08},"family":"glm-4.6","model_type":"chat","release_date":"2025-09-30","tagline":"Compared with GLM-4.5, this generation brings several key improvements:\n\nLonger context window: The context window has been expanded from 128K to 200K tokens, enabling the model to handle more complex","tools":["function_calling"],"status":"deprecated","deprecation_date":"2026-05-14"},{"id":"z-ai/glm-4.6v","name":"Z.ai: GLM 4.6V","created_by":"z-ai","source":"official","last_updated":"2026-06-10","description":"GLM-4.6V is a large multimodal model designed for high-fidelity visual understanding and long-context reasoning across images, documents, and mixed media.","context_window":131072,"max_output_tokens":32768,"modalities":{"input":["image","text","video"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":0.3,"output":0.9,"cached_input":0.055},"family":"glm-4.6","model_type":"chat","release_date":"2025-12-08","tagline":"GLM-4.6V is a large multimodal model designed for high-fidelity visual understanding and long-context reasoning across images, documents, and mixed media.","tools":["function_calling"]},{"id":"z-ai/glm-4.7-flash","name":"Z.ai: GLM 4.7 Flash","created_by":"z-ai","source":"official","last_updated":"2026-04-25","description":"As a 30B-class SOTA model, GLM-4.7-Flash offers a new option that balances performance and 
efficiency.","context_window":202752,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":0.06,"output":0.4,"cached_input":0.01},"family":"glm-4.7","model_type":"chat","release_date":"2026-01-19","tagline":"As a 30B-class SOTA model, GLM-4.7-Flash offers a new option that balances performance and efficiency.","tools":["function_calling"],"max_output_tokens":16384},{"id":"z-ai/glm-4.7","name":"Z.ai: GLM 4.7","created_by":"z-ai","source":"official","last_updated":"2026-05-10","description":"GLM-4.7 is Z.ai’s latest flagship model, featuring upgrades in two key areas: enhanced programming capabilities and more stable multi-step reasoning/execution.","context_window":202752,"max_output_tokens":131072,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":0.4,"output":1.75,"cached_input":0.08},"family":"glm-4.7","model_type":"chat","release_date":"2025-12-22","tagline":"GLM-4.7 is Z.ai’s latest flagship model, featuring upgrades in two key areas: enhanced programming capabilities and more stable multi-step reasoning/execution.","tools":["function_calling"]},{"id":"z-ai/glm-5-turbo","name":"Z.ai: GLM 5 Turbo","created_by":"z-ai","source":"official","last_updated":"2026-06-10","description":"GLM-5 Turbo is a new model from Z.ai designed for fast inference and strong performance in agent-driven environments such as OpenClaw scenarios.","context_window":262144,"max_output_tokens":131072,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":1.2,"output":4,"cached_input":0.24},"family":"glm-5","model_type":"chat","release_date":"2026-03-15","tagline":"GLM-5 Turbo is a new model from Z.ai designed for fast inference and strong performance in agent-driven 
environments such as OpenClaw scenarios.","tools":["function_calling"]},{"id":"z-ai/glm-5.1","name":"Z.ai: GLM 5.1","created_by":"z-ai","source":"official","family":"glm-5.1","description":"GLM-5.1 delivers a major leap in coding capability, with particularly significant gains in handling long-horizon tasks.","release_date":"2026-04-07","context_window":202752,"model_type":"chat","tagline":"GLM-5.1 delivers a major leap in coding capability, with particularly significant gains in handling long-horizon tasks.","capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.98,"output":3.08,"cached_input":0.182},"tools":["function_calling"],"last_updated":"2026-06-02","max_output_tokens":131072},{"id":"z-ai/glm-5.2","name":"Z.ai: GLM 5.2","created_by":"z-ai","source":"official","family":"glm-5.2","description":"GLM 5.2 is a large-scale reasoning model from Z.ai.","release_date":"2026-06-16","context_window":1048576,"max_output_tokens":32768,"model_type":"chat","tagline":"GLM 5.2 is a large-scale reasoning model from Z.ai.","capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.95,"output":3,"cached_input":0.18},"tools":["function_calling"],"last_updated":"2026-06-29"},{"id":"z-ai/glm-5","name":"Z.ai: GLM 5","created_by":"z-ai","source":"official","last_updated":"2026-06-03","description":"GLM-5 is Z.ai’s flagship open-source foundation model engineered for complex systems design and long-horizon agent workflows.","context_window":202752,"max_output_tokens":16384,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":0.6,"output":1.92,"cached_input":0.12},"family":"glm-5","model_type":"chat","release_date":"2026-02-11","tagline":"GLM-5 is Z.ai’s flagship 
open-source foundation model engineered for complex systems design and long-horizon agent workflows.","tools":["function_calling"]},{"id":"z-ai/glm-5v-turbo","name":"Z.ai: GLM 5V Turbo","created_by":"z-ai","source":"official","family":"glm-5","description":"GLM-5V-Turbo is Z.ai’s first native multimodal agent foundation model, built for vision-based coding and agent-driven tasks.","release_date":"2026-04-01","context_window":202752,"max_output_tokens":131072,"model_type":"chat","tagline":"GLM-5V-Turbo is Z.ai’s first native multimodal agent foundation model, built for vision-based coding and agent-driven tasks.","capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"modalities":{"input":["image","text","video"],"output":["text"]},"pricing":{"input":1.2,"output":4,"cached_input":0.24},"tools":["function_calling"],"last_updated":"2026-06-29","status":"deprecated","deprecation_date":"2098-12-31"}]}; +export const provider: ProviderWithModels = {"id":"openrouter","name":"OpenRouter","region":"US","headquarters":"New York, NY","founded":2023,"url":"https://openrouter.ai","api_url":"https://openrouter.ai/api/v1","docs_url":"https://openrouter.ai/docs","pricing_url":"https://openrouter.ai/models","description":"Unified API gateway providing access to 200+ models from multiple providers with standardized pricing.","type":"aggregator","playground_url":"https://openrouter.ai/playground","status_url":"https://status.openrouter.ai","openai_compatible":true,"free_tier":true,"github_url":"https://github.com/OpenRouterTeam","models_url":"https://openrouter.ai/models","twitter_url":"https://x.com/OpenRouterAI","discord_url":"https://discord.com/invite/openrouter","terms_url":"https://openrouter.ai/terms","support_url":"https://openrouter.ai/support","icon":"\n \n","models":[{"id":"~anthropic/claude-fable-latest","name":"Anthropic: Claude Fable Latest","created_by":"~anthropic","source":"official","family":"claude-fable","description":"This 
model always redirects to the latest model in the Claude Fable family.","release_date":"2026-06-09","context_window":1000000,"max_output_tokens":128000,"model_type":"chat","tagline":"This model always redirects to the latest model in the Claude Fable family.","capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":10,"output":50,"cached_input":1},"tools":["function_calling"],"last_updated":"2026-06-18"},{"id":"~anthropic/claude-haiku-latest","name":"Anthropic Claude Haiku Latest","created_by":"~anthropic","source":"official","family":"claude-haiku","description":"This model always redirects to the latest model in the Anthropic Claude Haiku family.","release_date":"2026-04-27","context_window":200000,"max_output_tokens":64000,"model_type":"chat","tagline":"This model always redirects to the latest model in the Anthropic Claude Haiku family.","capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":1,"output":5,"cached_input":0.1},"tools":["function_calling"],"last_updated":"2026-05-14"},{"id":"~anthropic/claude-opus-latest","name":"Anthropic: Claude Opus Latest","created_by":"~anthropic","source":"official","family":"claude-opus","description":"This model always redirects to the latest model in the Claude Opus family.","release_date":"2026-04-21","context_window":1000000,"max_output_tokens":128000,"model_type":"chat","tagline":"This model always redirects to the latest model in the Claude Opus family.","capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":5,"output":25,"cached_input":0.5},"tools":["function_calling"],"last_updated":"2026-04-22"},{"id":"~anthropic/claude-sonnet-latest","name":"Anthropic Claude Sonnet 
Latest","created_by":"~anthropic","source":"official","family":"claude-sonnet","description":"This model always redirects to the latest model in the Anthropic Claude Sonnet family.","release_date":"2026-04-27","context_window":1000000,"max_output_tokens":128000,"model_type":"chat","tagline":"This model always redirects to the latest model in the Anthropic Claude Sonnet family.","capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":3,"output":15,"cached_input":0.3},"tools":["function_calling"],"last_updated":"2026-05-01"},{"id":"~google/gemini-flash-latest","name":"Google Gemini Flash Latest","created_by":"~google","source":"official","description":"This model always redirects to the latest model in the Google Gemini Flash family.","release_date":"2026-04-27","context_window":1048576,"max_output_tokens":65536,"model_type":"chat","tagline":"This model always redirects to the latest model in the Google Gemini Flash family.","capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"modalities":{"input":["text","image","video","audio"],"output":["text"]},"pricing":{"input":1.5,"output":9,"cached_input":0.15},"tools":["function_calling"],"last_updated":"2026-05-23"},{"id":"~google/gemini-pro-latest","name":"Google Gemini Pro Latest","created_by":"~google","source":"official","description":"This model always redirects to the latest model in the Google Gemini Pro family.","release_date":"2026-04-27","context_window":1048576,"max_output_tokens":65536,"model_type":"chat","tagline":"This model always redirects to the latest model in the Google Gemini Pro 
family.","capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"modalities":{"input":["audio","image","text","video"],"output":["text"]},"pricing":{"input":2,"output":12,"cached_input":0.2},"tools":["function_calling"],"last_updated":"2026-05-01"},{"id":"~moonshotai/kimi-latest","name":"MoonshotAI Kimi Latest","created_by":"~moonshotai","source":"official","family":"kimi","description":"This model always redirects to the latest model in the MoonshotAI Kimi family.","release_date":"2026-04-27","context_window":262144,"max_output_tokens":262144,"model_type":"chat","tagline":"This model always redirects to the latest model in the MoonshotAI Kimi family.","capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":0.55,"output":3.2,"cached_input":0.11},"tools":["function_calling"],"last_updated":"2026-06-29"},{"id":"~openai/gpt-latest","name":"OpenAI GPT Latest","created_by":"~openai","source":"official","description":"This model always redirects to the latest model in the OpenAI GPT family.","release_date":"2026-04-27","context_window":1050000,"max_output_tokens":128000,"tagline":"This model always redirects to the latest model in the OpenAI GPT family.","capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"modalities":{"input":["image","text"],"output":["text"]},"pricing":{"input":5,"output":30,"cached_input":0.5},"tools":["function_calling"],"last_updated":"2026-05-01"},{"id":"~openai/gpt-mini-latest","name":"OpenAI GPT Mini Latest","created_by":"~openai","source":"official","description":"This model always redirects to the latest model in the OpenAI GPT Mini family.","release_date":"2026-04-27","context_window":400000,"max_output_tokens":128000,"tagline":"This model always redirects to the latest model in the OpenAI GPT Mini 
family.","capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"modalities":{"input":["image","text"],"output":["text"]},"pricing":{"input":0.75,"output":4.5,"cached_input":0.075},"tools":["function_calling"],"last_updated":"2026-05-01"},{"id":"ai21/jamba-large-1.7","name":"AI21: Jamba Large 1.7","created_by":"ai21","source":"official","last_updated":"2026-03-24","description":"Jamba Large 1.7 is the latest model in the Jamba open family, offering improvements in grounding, instruction-following, and overall efficiency.","context_window":256000,"max_output_tokens":4096,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true},"pricing":{"input":2,"output":8},"model_type":"chat","release_date":"2025-08-08","tagline":"Jamba Large 1.7 is the latest model in the Jamba open family, offering improvements in grounding, instruction-following, and overall efficiency.","tools":["function_calling"]},{"id":"aion-labs/aion-1.0-mini","name":"AionLabs: Aion-1.0-Mini","created_by":"aion-labs","source":"official","last_updated":"2026-03-23","description":"Aion-1.0-Mini 32B parameter model is a distilled version of the DeepSeek-R1 model, designed for strong performance in reasoning domains such as mathematics, coding, and logic.","context_window":131072,"max_output_tokens":32768,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"reasoning":true},"pricing":{"input":0.7,"output":1.4},"release_date":"2025-02-04","tagline":"Aion-1.0-Mini 32B parameter model is a distilled version of the DeepSeek-R1 model, designed for strong performance in reasoning domains such as mathematics, coding, and logic."},{"id":"aion-labs/aion-1.0","name":"AionLabs: Aion-1.0","created_by":"aion-labs","source":"official","last_updated":"2026-03-23","description":"Aion-1.0 is a multi-model system designed for high performance across various tasks, including reasoning and 
coding.","context_window":131072,"max_output_tokens":32768,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"reasoning":true},"pricing":{"input":4,"output":8},"release_date":"2025-02-04","tagline":"Aion-1.0 is a multi-model system designed for high performance across various tasks, including reasoning and coding."},{"id":"aion-labs/aion-2.0","name":"AionLabs: Aion-2.0","created_by":"aion-labs","source":"official","last_updated":"2026-03-23","description":"Aion-2.0 is a variant of DeepSeek V3.2 optimized for immersive roleplaying and storytelling.","context_window":131072,"max_output_tokens":32768,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"reasoning":true},"pricing":{"input":0.8,"output":1.6,"cached_input":0.2},"release_date":"2026-02-23","tagline":"Aion-2.0 is a variant of DeepSeek V3.2 optimized for immersive roleplaying and storytelling."},{"id":"aion-labs/aion-rp-llama-3.1-8b","name":"AionLabs: Aion-RP 1.0 (8B)","created_by":"aion-labs","source":"official","last_updated":"2026-03-23","description":"Aion-RP-Llama-3.1-8B ranks the highest in the character evaluation portion of the RPBench-Auto benchmark, a roleplaying-specific variant of Arena-Hard-Auto, where LLMs evaluate each other’s responses.","context_window":32768,"max_output_tokens":32768,"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.8,"output":1.6},"parameters":8,"release_date":"2025-02-04","tagline":"Aion-RP-Llama-3.1-8B ranks the highest in the character evaluation portion of the RPBench-Auto benchmark, a roleplaying-specific variant of Arena-Hard-Auto, where LLMs evaluate each other’s responses."},{"id":"alfredpros/codellama-7b-instruct-solidity","name":"AlfredPros: CodeLLaMa 7B Instruct Solidity","created_by":"alfredpros","source":"official","last_updated":"2026-03-23","description":"A finetuned 7 billion parameters Code LLaMA - Instruct model to generate Solidity smart contract using 4-bit QLoRA finetuning provided by PEFT 
library.","context_window":4096,"max_output_tokens":4096,"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.8,"output":1.2},"family":"codellama","model_type":"code","parameters":7,"release_date":"2025-04-14","tagline":"A finetuned 7 billion parameters Code LLaMA - Instruct model to generate Solidity smart contract using 4-bit QLoRA finetuning provided by PEFT library."},{"id":"alibaba/tongyi-deepresearch-30b-a3b","name":"Tongyi DeepResearch 30B A3B","created_by":"alibaba","source":"official","last_updated":"2026-03-24","description":"Tongyi DeepResearch is an agentic large language model developed by Tongyi Lab, with 30 billion total parameters activating only 3 billion per token.","context_window":131072,"max_output_tokens":131072,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":0.09,"output":0.45,"cached_input":0.09},"model_type":"chat","parameters":30,"active_parameters":3,"release_date":"2025-09-18","tagline":"Tongyi DeepResearch is an agentic large language model developed by Tongyi Lab, with 30 billion total parameters activating only 3 billion per token.","tools":["function_calling"]},{"id":"allenai/molmo-2-8b","name":"AllenAI: Molmo2 8B","created_by":"allenai","source":"official","last_updated":"2026-03-21","description":"Molmo2-8B is an open vision-language model developed by the Allen Institute for AI (Ai2) as part of the Molmo2 family, supporting image, video, and multi-image understanding and grounding.","status":"deprecated","deprecation_date":"2026-03-23","context_window":36864,"max_output_tokens":36864,"modalities":{"input":["text","image","video"],"output":["text"]},"pricing":{"input":0.2,"output":0.2},"parameters":8},{"id":"allenai/olmo-2-0325-32b-instruct","name":"AllenAI: Olmo 2 32B Instruct","created_by":"allenai","source":"official","last_updated":"2026-03-23","description":"OLMo-2 32B Instruct is a supervised 
instruction-finetuned variant of the OLMo-2 32B March 2025 base model.","context_window":128000,"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.05,"output":0.2},"parameters":32,"release_date":"2025-03-14","tagline":"OLMo-2 32B Instruct is a supervised instruction-finetuned variant of the OLMo-2 32B March 2025 base model."},{"id":"allenai/olmo-3-32b-think","name":"AllenAI: Olmo 3 32B Think","created_by":"allenai","source":"official","last_updated":"2026-03-24","description":"Olmo 3 32B Think is a large-scale, 32-billion-parameter model purpose-built for deep reasoning, complex logic chains and advanced instruction-following scenarios.","context_window":65536,"max_output_tokens":65536,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":0.15,"output":0.5},"parameters":32,"release_date":"2025-11-21","tagline":"Olmo 3 32B Think is a large-scale, 32-billion-parameter model purpose-built for deep reasoning, complex logic chains and advanced instruction-following scenarios."},{"id":"allenai/olmo-3-7b-instruct","name":"AllenAI: Olmo 3 7B Instruct","created_by":"allenai","source":"official","last_updated":"2026-03-21","description":"Olmo 3 7B Instruct is a supervised instruction-fine-tuned variant of the Olmo 3 7B base model, optimized for instruction-following, question-answering, and natural conversational dialogue.","status":"deprecated","deprecation_date":"2026-03-23","context_window":65536,"max_output_tokens":65536,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"structured_output":true,"json_mode":true},"pricing":{"input":0.1,"output":0.2},"parameters":7},{"id":"allenai/olmo-3-7b-think","name":"AllenAI: Olmo 3 7B Think","created_by":"allenai","source":"official","last_updated":"2026-03-21","description":"Olmo 3 7B Think is a research-oriented language model in the Olmo family designed for advanced reasoning and instruction-driven 
tasks.","status":"deprecated","deprecation_date":"2026-03-23","context_window":65536,"max_output_tokens":65536,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":0.12,"output":0.2},"parameters":7},{"id":"allenai/olmo-3.1-32b-instruct","name":"AllenAI: Olmo 3.1 32B Instruct","created_by":"allenai","source":"official","last_updated":"2026-05-01","description":"Olmo 3.1 32B Instruct is a large-scale, 32-billion-parameter instruction-tuned language model engineered for high-performance conversational AI, multi-turn dialogue, and practical instruction following.","context_window":65536,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true},"pricing":{"input":0.2,"output":0.6},"parameters":32,"release_date":"2026-01-06","tagline":"Olmo 3.1 32B Instruct is a large-scale, 32-billion-parameter instruction-tuned language model engineered for high-performance conversational AI, multi-turn dialogue, and practical instruction followin","tools":["function_calling"],"max_output_tokens":16384,"status":"deprecated","deprecation_date":"2026-05-07"},{"id":"allenai/olmo-3.1-32b-think","name":"AllenAI: Olmo 3.1 32B Think","created_by":"allenai","source":"official","last_updated":"2026-03-24","description":"Olmo 3.1 32B Think is a large-scale, 32-billion-parameter model designed for deep reasoning, complex multi-step logic, and advanced instruction following.","context_window":65536,"max_output_tokens":65536,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":0.15,"output":0.5},"parameters":32,"status":"deprecated","release_date":"2025-12-16","deprecation_date":"2026-04-06","tagline":"Olmo 3.1 32B Think is a large-scale, 32-billion-parameter model designed for deep reasoning, complex multi-step logic, and advanced instruction 
following."},{"id":"alpindale/goliath-120b","name":"Goliath 120B","created_by":"alpindale","source":"official","last_updated":"2026-03-24","description":"A large LLM created by combining two fine-tuned Llama 70B models into one 120B model.","context_window":6144,"max_output_tokens":1024,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"structured_output":true,"json_mode":true},"pricing":{"input":3.75,"output":7.5},"parameters":120,"release_date":"2023-11-10","tagline":"A large LLM created by combining two fine-tuned Llama 70B models into one 120B model."},{"id":"amazon/nova-2-lite-v1","name":"Amazon: Nova 2 Lite","created_by":"amazon","source":"official","last_updated":"2026-03-23","description":"Nova 2 Lite is a fast, cost-effective reasoning model for everyday workloads that can process text, images, and videos to generate text.","context_window":1000000,"max_output_tokens":65535,"modalities":{"input":["text","image","video"],"output":["text"]},"capabilities":{"tool_call":true,"reasoning":true},"pricing":{"input":0.3,"output":2.5},"model_type":"chat","release_date":"2025-12-02","tagline":"Nova 2 Lite is a fast, cost-effective reasoning model for everyday workloads that can process text, images, and videos to generate text.","tools":["function_calling"]},{"id":"amazon/nova-lite-v1","name":"Amazon: Nova Lite 1.0","created_by":"amazon","source":"official","last_updated":"2026-03-23","description":"Amazon Nova Lite 1.0 is a very low-cost multimodal model from Amazon that focused on fast processing of image, video, and text inputs to generate text output.","context_window":300000,"max_output_tokens":5120,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"tool_call":true},"pricing":{"input":0.06,"output":0.24},"model_type":"chat","release_date":"2024-12-05","tagline":"Amazon Nova Lite 1.0 is a very low-cost multimodal model from Amazon that focused on fast processing of image, video, and text inputs to generate text 
output.","tools":["function_calling"]},{"id":"amazon/nova-micro-v1","name":"Amazon: Nova Micro 1.0","created_by":"amazon","source":"official","last_updated":"2026-03-23","description":"Amazon Nova Micro 1.0 is a text-only model that delivers the lowest latency responses in the Amazon Nova family of models at a very low cost.","context_window":128000,"max_output_tokens":5120,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true},"pricing":{"input":0.035,"output":0.14},"model_type":"chat","release_date":"2024-12-05","tagline":"Amazon Nova Micro 1.0 is a text-only model that delivers the lowest latency responses in the Amazon Nova family of models at a very low cost.","tools":["function_calling"]},{"id":"amazon/nova-premier-v1","name":"Amazon: Nova Premier 1.0","created_by":"amazon","source":"official","last_updated":"2026-03-23","description":"Amazon Nova Premier is the most capable of Amazon’s multimodal models for complex reasoning tasks and for use as the best teacher for distilling custom models.","context_window":1000000,"max_output_tokens":32000,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"tool_call":true},"pricing":{"input":2.5,"output":12.5,"cached_input":0.625},"model_type":"chat","release_date":"2025-10-31","tagline":"Amazon Nova Premier is the most capable of Amazon’s multimodal models for complex reasoning tasks and for use as the best teacher for distilling custom models.","tools":["function_calling"]},{"id":"amazon/nova-pro-v1","name":"Amazon: Nova Pro 1.0","created_by":"amazon","source":"official","last_updated":"2026-03-23","description":"Amazon Nova Pro 1.0 is a capable multimodal model from Amazon focused on providing a combination of accuracy, speed, and cost for a wide range of 
tasks.","context_window":300000,"max_output_tokens":5120,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"tool_call":true},"pricing":{"input":0.8,"output":3.2},"model_type":"chat","release_date":"2024-12-05","tagline":"Amazon Nova Pro 1.0 is a capable multimodal model from Amazon focused on providing a combination of accuracy, speed, and cost for a wide range of tasks.","tools":["function_calling"]},{"id":"anthracite-org/magnum-v4-72b","name":"Magnum v4 72B","created_by":"anthracite-org","source":"official","last_updated":"2026-05-17","description":"This is a series of models designed to replicate the prose quality of the Claude 3 models, specifically Sonnet(https://openrouter.ai/anthropic/claude-3.5-sonnet) and Opus(https://openrouter.ai/anthropic/claude-3-opus).","context_window":32768,"max_output_tokens":2048,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"structured_output":true,"json_mode":true},"pricing":{"input":3,"output":5},"parameters":72,"release_date":"2024-10-22","tagline":"This is a series of models designed to replicate the prose quality of the Claude 3 models, specifically Sonnet(https://openrouter.ai/anthropic/claude-3.5-sonnet) and Opus(https://openrouter.ai/anthrop"},{"id":"anthropic/claude-3-haiku","name":"Anthropic: Claude 3 Haiku","created_by":"anthropic","source":"official","last_updated":"2026-03-23","family":"claude-haiku","description":"Claude 3 Haiku is Anthropic's fastest and most compact model for\nnear-instant responsiveness. 
Quick and accurate targeted performance.\n\nSee the launch announcement and benchmark results [here](https:/","context_window":200000,"max_output_tokens":4096,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"tool_call":true,"streaming":true,"vision":true,"batch":true},"pricing":{"input":0.25,"output":1.25,"cached_input":0.03},"model_type":"chat","release_date":"2024-03-13","tagline":"Claude 3 Haiku is Anthropic's fastest and most compact model for\nnear-instant responsiveness. Quick and accurate targeted performance.\n\nSee the launch announcement and benchmark results [here](https:/","tools":["function_calling"],"license":"proprietary","open_weight":false},{"id":"anthropic/claude-3.5-haiku","name":"Anthropic: Claude 3.5 Haiku","created_by":"anthropic","source":"official","last_updated":"2026-03-23","family":"claude-haiku","description":"Claude 3.5 Haiku features offers enhanced capabilities in speed, coding accuracy, and tool use.","context_window":200000,"max_output_tokens":8192,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"tool_call":true},"pricing":{"input":0.8,"output":4,"cached_input":0.08},"model_type":"chat","release_date":"2024-11-04","tagline":"Claude 3.5 Haiku features offers enhanced capabilities in speed, coding accuracy, and tool use.","tools":["function_calling"]},{"id":"anthropic/claude-3.5-sonnet","name":"Anthropic: Claude 3.5 Sonnet","created_by":"anthropic","source":"official","last_updated":"2026-03-23","family":"claude-sonnet","description":"New Claude 3.5 Sonnet delivers better-than-Opus capabilities, faster-than-Sonnet speeds, at the same Sonnet prices.","context_window":200000,"max_output_tokens":8192,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"tool_call":true},"pricing":{"input":6,"output":30,"cached_input":0.6},"model_type":"chat","release_date":"2024-10-22","tagline":"New Claude 3.5 Sonnet delivers better-than-Opus capabilities, faster-than-Sonnet 
speeds, at the same Sonnet prices.","tools":["function_calling"]},{"id":"anthropic/claude-3.7-sonnet:thinking","name":"Anthropic: Claude 3.7 Sonnet (thinking)","created_by":"anthropic","source":"official","last_updated":"2026-05-06","family":"claude-sonnet","description":"Claude 3.7 Sonnet is an advanced large language model with improved reasoning, coding, and problem-solving capabilities.","status":"deprecated","deprecation_date":"2026-05-11","context_window":200000,"max_output_tokens":64000,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"tool_call":true,"reasoning":true},"pricing":{"input":3,"output":15,"cached_input":0.3},"model_type":"chat","release_date":"2025-02-24","tagline":"Claude 3.7 Sonnet is an advanced large language model with improved reasoning, coding, and problem-solving capabilities.","tools":["function_calling"]},{"id":"anthropic/claude-3.7-sonnet","name":"Anthropic: Claude 3.7 Sonnet","created_by":"anthropic","source":"official","last_updated":"2026-05-06","family":"claude-sonnet","description":"Claude 3.7 Sonnet is an advanced large language model with improved reasoning, coding, and problem-solving capabilities.","status":"deprecated","deprecation_date":"2026-05-11","context_window":200000,"max_output_tokens":64000,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"tool_call":true,"reasoning":true},"pricing":{"input":3,"output":15,"cached_input":0.3},"model_type":"chat","release_date":"2025-02-24","tagline":"Claude 3.7 Sonnet is an advanced large language model with improved reasoning, coding, and problem-solving capabilities.","tools":["function_calling"]},{"id":"anthropic/claude-fable-5","name":"Anthropic: Claude Fable 5","created_by":"anthropic","source":"official","family":"claude-fable","description":"Claude Fable 5 is a Mythos-class model from Anthropic, built for autonomous knowledge work and 
coding.","release_date":"2026-06-09","context_window":1000000,"max_output_tokens":128000,"model_type":"chat","tagline":"Claude Fable 5 is a Mythos-class model from Anthropic, built for autonomous knowledge work and coding.","capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"vision":true,"batch":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":10,"output":50,"cached_input":1},"tools":["function_calling"],"last_updated":"2026-06-18","license":"proprietary","open_weight":false},{"id":"anthropic/claude-haiku-4.5","name":"Anthropic: Claude Haiku 4.5","created_by":"anthropic","source":"official","last_updated":"2026-05-14","family":"claude-haiku","description":"Claude Haiku 4.5 is Anthropic’s fastest and most efficient model, delivering near-frontier intelligence at a fraction of the cost and latency of larger Claude models.","context_window":200000,"max_output_tokens":64000,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":1,"output":5,"cached_input":0.1},"model_type":"chat","release_date":"2025-10-15","tagline":"Claude Haiku 4.5 is Anthropic’s fastest and most efficient model, delivering near-frontier intelligence at a fraction of the cost and latency of larger Claude models.","tools":["function_calling"]},{"id":"anthropic/claude-opus-4.1","name":"Anthropic: Claude Opus 4.1","created_by":"anthropic","source":"official","last_updated":"2026-03-24","family":"claude-opus","description":"Claude Opus 4.1 is an updated version of Anthropic’s flagship model, offering improved performance in coding, reasoning, and agentic 
tasks.","context_window":200000,"max_output_tokens":32000,"modalities":{"input":["image","text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":15,"output":75,"cached_input":1.5},"model_type":"chat","release_date":"2025-08-05","tagline":"Claude Opus 4.1 is an updated version of Anthropic’s flagship model, offering improved performance in coding, reasoning, and agentic tasks.","tools":["function_calling"]},{"id":"anthropic/claude-opus-4.5","name":"Anthropic: Claude Opus 4.5","created_by":"anthropic","source":"official","last_updated":"2026-03-24","family":"claude-opus","description":"Claude Opus 4.5 is Anthropic’s frontier reasoning model optimized for complex software engineering, agentic workflows, and long-horizon computer use.","context_window":200000,"max_output_tokens":64000,"modalities":{"input":["image","text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":5,"output":25,"cached_input":0.5},"model_type":"chat","release_date":"2025-11-24","tagline":"Claude Opus 4.5 is Anthropic’s frontier reasoning model optimized for complex software engineering, agentic workflows, and long-horizon computer use.","tools":["function_calling"]},{"id":"anthropic/claude-opus-4.6-fast","name":"Anthropic: Claude Opus 4.6 (Fast)","created_by":"anthropic","source":"official","family":"claude-opus","description":"Fast-mode variant of [Opus 4.6](/anthropic/claude-opus-4.6) - identical capabilities with higher output speed at premium 6x pricing.","release_date":"2026-04-07","context_window":1000000,"max_output_tokens":128000,"model_type":"chat","tagline":"Fast-mode variant of [Opus 4.6](/anthropic/claude-opus-4.6) - identical capabilities with higher output speed at premium 6x 
pricing.","capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":30,"output":150,"cached_input":3},"tools":["function_calling"],"last_updated":"2026-05-29","status":"deprecated","deprecation_date":"2026-06-29"},{"id":"anthropic/claude-opus-4.6","name":"Anthropic: Claude Opus 4.6","created_by":"anthropic","source":"official","last_updated":"2026-03-24","family":"claude-opus","description":"Opus 4.6 is Anthropic’s strongest model for coding and long-running professional tasks.","context_window":1000000,"max_output_tokens":128000,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":5,"output":25,"cached_input":0.5},"model_type":"chat","release_date":"2026-02-04","tagline":"Opus 4.6 is Anthropic’s strongest model for coding and long-running professional tasks.","tools":["function_calling"]},{"id":"anthropic/claude-opus-4.7-fast","name":"Anthropic: Claude Opus 4.7 (Fast)","created_by":"anthropic","source":"official","family":"claude-opus","description":"Fast-mode variant of [Opus 4.7](/anthropic/claude-opus-4.7) - identical capabilities with higher output speed at premium 6x pricing.","release_date":"2026-05-12","context_window":1000000,"max_output_tokens":128000,"model_type":"chat","tagline":"Fast-mode variant of [Opus 4.7](/anthropic/claude-opus-4.7) - identical capabilities with higher output speed at premium 6x pricing.","capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":30,"output":150,"cached_input":3},"tools":["function_calling"],"last_updated":"2026-05-14"},{"id":"anthropic/claude-opus-4.7","name":"Anthropic: Claude Opus 4.7","created_by":"anthropic","source":"official","family":"claude-opus","description":"Opus 4.7 
is the next generation of Anthropic's Opus family, built for long-running, asynchronous agents.","release_date":"2026-04-16","context_window":1000000,"max_output_tokens":128000,"model_type":"chat","tagline":"Opus 4.7 is the next generation of Anthropic's Opus family, built for long-running, asynchronous agents.","capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":5,"output":25,"cached_input":0.5},"tools":["function_calling"],"last_updated":"2026-04-17"},{"id":"anthropic/claude-opus-4.8-fast","name":"Anthropic: Claude Opus 4.8 (Fast)","created_by":"anthropic","source":"official","family":"claude-opus","description":"Fast-mode variant of [Opus 4.8](/anthropic/claude-opus-4.8) - identical capabilities with higher output speed at 2x pricing relative to regular Opus 4.8.","release_date":"2026-05-27","context_window":1000000,"max_output_tokens":128000,"model_type":"chat","tagline":"Fast-mode variant of [Opus 4.8](/anthropic/claude-opus-4.8) - identical capabilities with higher output speed at 2x pricing relative to regular Opus 4.8.","capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":10,"output":50,"cached_input":1},"tools":["function_calling"],"last_updated":"2026-05-29"},{"id":"anthropic/claude-opus-4.8","name":"Anthropic: Claude Opus 4.8","created_by":"anthropic","source":"official","family":"claude-opus","description":"Claude Opus 4.8 is Anthropic's most capable generally available model in the Opus family.","release_date":"2026-05-27","context_window":1000000,"max_output_tokens":128000,"model_type":"chat","tagline":"Claude Opus 4.8 is Anthropic's most capable generally available model in the Opus 
family.","capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":5,"output":25,"cached_input":0.5},"tools":["function_calling"],"last_updated":"2026-05-29"},{"id":"anthropic/claude-opus-4","name":"Anthropic: Claude Opus 4","created_by":"anthropic","source":"official","last_updated":"2026-03-23","family":"claude-opus","description":"Claude Opus 4 is benchmarked as the world’s best coding model, at time of release, bringing sustained performance on complex, long-running tasks and agent workflows.","context_window":200000,"max_output_tokens":32000,"modalities":{"input":["image","text"],"output":["text"]},"capabilities":{"tool_call":true,"reasoning":true},"pricing":{"input":15,"output":75,"cached_input":1.5},"model_type":"chat","release_date":"2025-05-22","tagline":"Claude Opus 4 is benchmarked as the world’s best coding model, at time of release, bringing sustained performance on complex, long-running tasks and agent workflows.","tools":["function_calling"]},{"id":"anthropic/claude-sonnet-4.5","name":"Anthropic: Claude Sonnet 4.5","created_by":"anthropic","source":"official","last_updated":"2026-03-24","family":"claude-sonnet","description":"Claude Sonnet 4.5 is Anthropic’s most advanced Sonnet model to date, optimized for real-world agents and coding workflows.","context_window":1000000,"max_output_tokens":64000,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":3,"output":15,"cached_input":0.3},"model_type":"chat","release_date":"2025-09-29","tagline":"Claude Sonnet 4.5 is Anthropic’s most advanced Sonnet model to date, optimized for real-world agents and coding workflows.","tools":["function_calling"]},{"id":"anthropic/claude-sonnet-4.6","name":"Anthropic: Claude Sonnet 
4.6","created_by":"anthropic","source":"official","last_updated":"2026-03-24","family":"claude-sonnet","description":"Sonnet 4.6 is Anthropic's most capable Sonnet-class model yet, with frontier performance across coding, agents, and professional work.","context_window":1000000,"max_output_tokens":128000,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":3,"output":15,"cached_input":0.3},"model_type":"chat","release_date":"2026-02-17","tagline":"Sonnet 4.6 is Anthropic's most capable Sonnet-class model yet, with frontier performance across coding, agents, and professional work.","tools":["function_calling"]},{"id":"anthropic/claude-sonnet-4","name":"Anthropic: Claude Sonnet 4","created_by":"anthropic","source":"official","last_updated":"2026-04-12","family":"claude-sonnet","description":"Claude Sonnet 4 significantly enhances the capabilities of its predecessor, Sonnet 3.7, excelling in both coding and reasoning tasks with improved precision and controllability.","context_window":1000000,"max_output_tokens":64000,"modalities":{"input":["image","text"],"output":["text"]},"capabilities":{"tool_call":true,"reasoning":true},"pricing":{"input":3,"output":15,"cached_input":0.3},"model_type":"chat","release_date":"2025-05-22","tagline":"Claude Sonnet 4 significantly enhances the capabilities of its predecessor, Sonnet 3.7, excelling in both coding and reasoning tasks with improved precision and controllability.","tools":["function_calling"]},{"id":"arcee-ai/coder-large","name":"Arcee AI: Coder Large","created_by":"arcee-ai","source":"official","last_updated":"2026-04-07","description":"Coder‑Large is a 32 B‑parameter offspring of Qwen 2.5‑Instruct that has been further trained on permissively‑licensed GitHub, CodeSearchNet and synthetic bug‑fix 
corpora.","context_window":32768,"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.5,"output":0.8},"release_date":"2025-05-05","tagline":"Coder‑Large is a 32 B‑parameter offspring of Qwen 2.5‑Instruct that has been further trained on permissively‑licensed GitHub, CodeSearchNet and synthetic bug‑fix corpora."},{"id":"arcee-ai/maestro-reasoning","name":"Arcee AI: Maestro Reasoning","created_by":"arcee-ai","source":"official","last_updated":"2026-04-07","description":"Maestro Reasoning is Arcee's flagship analysis model: a 32 B‑parameter derivative of Qwen 2.5‑32 B tuned with DPO and chain‑of‑thought RL for step‑by‑step logic.","context_window":131072,"max_output_tokens":32000,"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.9,"output":3.3},"model_type":"reasoning","release_date":"2025-05-05","tagline":"Maestro Reasoning is Arcee's flagship analysis model: a 32 B‑parameter derivative of Qwen 2.5‑32 B tuned with DPO and chain‑of‑thought RL for step‑by‑step logic."},{"id":"arcee-ai/spotlight","name":"Arcee AI: Spotlight","created_by":"arcee-ai","source":"official","last_updated":"2026-04-07","description":"Spotlight is a 7‑billion‑parameter vision‑language model derived from Qwen 2.5‑VL and fine‑tuned by Arcee AI for tight image‑text grounding tasks.","context_window":131072,"max_output_tokens":65537,"modalities":{"input":["image","text"],"output":["text"]},"pricing":{"input":0.18,"output":0.18},"release_date":"2025-05-05","tagline":"Spotlight is a 7‑billion‑parameter vision‑language model derived from Qwen 2.5‑VL and fine‑tuned by Arcee AI for tight image‑text grounding tasks."},{"id":"arcee-ai/trinity-large-preview:free","name":"Arcee AI: Trinity Large Preview (free)","created_by":"arcee-ai","source":"official","last_updated":"2026-04-10","description":"Trinity-Large-Preview is a frontier-scale open-weight language model from Arcee, built as a 400B-parameter sparse Mixture-of-Experts with 13B active parameters per token using 
4-of-256 expert routing.","context_window":131000,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true},"release_date":"2026-01-27","tagline":"Trinity-Large-Preview is a frontier-scale open-weight language model from Arcee, built as a 400B-parameter sparse Mixture-of-Experts with 13B active parameters per token using 4-of-256 expert routing.","tools":["function_calling"],"status":"deprecated","deprecation_date":"2026-04-22"},{"id":"arcee-ai/trinity-large-preview","name":"Arcee AI: Trinity Large Preview","created_by":"arcee-ai","source":"official","description":"Trinity-Large-Preview is a frontier-scale open-weight language model from Arcee, built as a 400B-parameter sparse Mixture-of-Experts with 13B active parameters per token using 4-of-256 expert routing.","release_date":"2026-01-27","context_window":131000,"tagline":"Trinity-Large-Preview is a frontier-scale open-weight language model from Arcee, built as a 400B-parameter sparse Mixture-of-Experts with 13B active parameters per token using 4-of-256 expert routing.","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.15,"output":0.45},"tools":["function_calling"],"last_updated":"2026-04-24"},{"id":"arcee-ai/trinity-large-thinking:free","name":"Arcee AI: Trinity Large Thinking (free)","created_by":"arcee-ai","source":"official","description":"Trinity Large Thinking is a powerful open source reasoning model from the team at Arcee AI.","release_date":"2026-04-01","context_window":262144,"max_output_tokens":80000,"tagline":"Trinity Large Thinking is a powerful open source reasoning model from the team at Arcee AI.","capabilities":{"tool_call":true,"reasoning":true},"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-05-14"},{"id":"arcee-ai/trinity-large-thinking","name":"Arcee AI: Trinity Large 
Thinking","created_by":"arcee-ai","source":"official","description":"Trinity Large Thinking is a powerful open source reasoning model from the team at Arcee AI.","release_date":"2026-04-01","context_window":262144,"max_output_tokens":80000,"tagline":"Trinity Large Thinking is a powerful open source reasoning model from the team at Arcee AI.","capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.25,"output":0.8,"cached_input":0.06},"tools":["function_calling"],"last_updated":"2026-06-29"},{"id":"arcee-ai/trinity-mini:free","name":"Arcee AI: Trinity Mini (free)","created_by":"arcee-ai","source":"official","last_updated":"2026-04-03","description":"Trinity Mini is a 26B-parameter (3B active) sparse mixture-of-experts language model featuring 128 experts with 8 active per token.","context_window":131072,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"release_date":"2025-12-01","tagline":"Trinity Mini is a 26B-parameter (3B active) sparse mixture-of-experts language model featuring 128 experts with 8 active per token.","tools":["function_calling"],"status":"deprecated","deprecation_date":"2026-04-10"},{"id":"arcee-ai/trinity-mini","name":"Arcee AI: Trinity Mini","created_by":"arcee-ai","source":"official","last_updated":"2026-03-24","description":"Trinity Mini is a 26B-parameter (3B active) sparse mixture-of-experts language model featuring 128 experts with 8 active per token.","context_window":131072,"max_output_tokens":131072,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":0.045,"output":0.15},"release_date":"2025-12-01","tagline":"Trinity Mini is a 26B-parameter (3B active) sparse mixture-of-experts language model featuring 128 experts with 8 active per 
token.","tools":["function_calling"]},{"id":"arcee-ai/virtuoso-large","name":"Arcee AI: Virtuoso Large","created_by":"arcee-ai","source":"official","last_updated":"2026-04-07","description":"Virtuoso‑Large is Arcee's top‑tier general‑purpose LLM at 72 B parameters, tuned to tackle cross‑domain reasoning, creative writing and enterprise QA.","context_window":131072,"max_output_tokens":64000,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true},"pricing":{"input":0.75,"output":1.2},"release_date":"2025-05-05","tagline":"Virtuoso‑Large is Arcee's top‑tier general‑purpose LLM at 72 B parameters, tuned to tackle cross‑domain reasoning, creative writing and enterprise QA.","tools":["function_calling"]},{"id":"baidu/cobuddy:free","name":"Baidu Qianfan: CoBuddy (free)","created_by":"baidu","source":"official","description":"CoBuddy is a code generation model from Baidu, optimized for coding tasks and AI Agent workflows.","release_date":"2026-05-06","context_window":131072,"max_output_tokens":65536,"tagline":"CoBuddy is a code generation model from Baidu, optimized for coding tasks and AI Agent workflows.","capabilities":{"tool_call":true,"reasoning":true},"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-05-06"},{"id":"baidu/ernie-4.5-21b-a3b-thinking","name":"Baidu: ERNIE 4.5 21B A3B Thinking","created_by":"baidu","source":"official","last_updated":"2026-03-23","description":"ERNIE-4.5-21B-A3B-Thinking is Baidu's upgraded lightweight MoE model, refined to boost reasoning depth and quality for top-tier performance in logical puzzles, math, science, coding, text generation, ","context_window":131072,"max_output_tokens":65536,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"reasoning":true},"pricing":{"input":0.07,"output":0.28},"parameters":21,"active_parameters":3,"release_date":"2025-10-09","tagline":"ERNIE-4.5-21B-A3B-Thinking is Baidu's upgraded lightweight MoE model, 
refined to boost reasoning depth and quality for top-tier performance in logical puzzles, math, science, coding, text generation, "},{"id":"baidu/ernie-4.5-21b-a3b","name":"Baidu: ERNIE 4.5 21B A3B","created_by":"baidu","source":"official","last_updated":"2026-05-17","description":"A sophisticated text-based Mixture-of-Experts (MoE) model featuring 21B total parameters with 3B activated per token, delivering exceptional multimodal understanding and generation through heterogeneous MoE structures and modality-isolated routing.","context_window":131072,"max_output_tokens":8000,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true},"pricing":{"input":0.07,"output":0.28},"parameters":21,"active_parameters":3,"release_date":"2025-08-12","tagline":"A sophisticated text-based Mixture-of-Experts (MoE) model featuring 21B total parameters with 3B activated per token, delivering exceptional multimodal understanding and generation through heterogeneo","tools":["function_calling"]},{"id":"baidu/ernie-4.5-300b-a47b","name":"Baidu: ERNIE 4.5 300B A47B ","created_by":"baidu","source":"official","last_updated":"2026-05-17","description":"ERNIE-4.5-300B-A47B is a 300B parameter Mixture-of-Experts (MoE) language model developed by Baidu as part of the ERNIE 4.5 series.","context_window":131072,"max_output_tokens":12000,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"structured_output":true,"json_mode":true},"pricing":{"input":0.28,"output":1.1},"parameters":300,"active_parameters":47,"release_date":"2025-06-30","tagline":"ERNIE-4.5-300B-A47B is a 300B parameter Mixture-of-Experts (MoE) language model developed by Baidu as part of the ERNIE 4.5 series."},{"id":"baidu/ernie-4.5-vl-28b-a3b","name":"Baidu: ERNIE 4.5 VL 28B A3B","created_by":"baidu","source":"official","last_updated":"2026-05-17","description":"A powerful multimodal Mixture-of-Experts chat model featuring 28B total parameters with 3B activated per token, delivering 
exceptional text and vision understanding through its innovative heterogeneou","context_window":131072,"max_output_tokens":8000,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"tool_call":true,"reasoning":true},"pricing":{"input":0.14,"output":0.56},"parameters":28,"active_parameters":3,"release_date":"2025-08-12","tagline":"A powerful multimodal Mixture-of-Experts chat model featuring 28B total parameters with 3B activated per token, delivering exceptional text and vision understanding through its innovative heterogeneou","tools":["function_calling"]},{"id":"baidu/ernie-4.5-vl-424b-a47b","name":"Baidu: ERNIE 4.5 VL 424B A47B ","created_by":"baidu","source":"official","last_updated":"2026-05-17","description":"ERNIE-4.5-VL-424B-A47B is a multimodal Mixture-of-Experts (MoE) model from Baidu’s ERNIE 4.5 series, featuring 424B total parameters with 47B active per token.","context_window":131072,"max_output_tokens":16000,"modalities":{"input":["image","text"],"output":["text"]},"capabilities":{"reasoning":true},"pricing":{"input":0.42,"output":1.25},"parameters":424,"active_parameters":47,"release_date":"2025-06-30","tagline":"ERNIE-4.5-VL-424B-A47B is a multimodal Mixture-of-Experts (MoE) model from Baidu’s ERNIE 4.5 series, featuring 424B total parameters with 47B active per token."},{"id":"baidu/qianfan-ocr-fast:free","name":"Baidu: Qianfan-OCR-Fast (free)","created_by":"baidu","source":"official","description":"Qianfan-OCR-Fast is a domain-specific multimodal large model purpose-built for OCR.","release_date":"2026-04-20","context_window":65536,"max_output_tokens":28672,"tagline":"Qianfan-OCR-Fast is a domain-specific multimodal large model purpose-built for OCR.","capabilities":{"reasoning":true},"modalities":{"input":["image","text"],"output":["text"]},"last_updated":"2026-04-24"},{"id":"baidu/qianfan-ocr-fast","name":"Baidu: Qianfan-OCR-Fast","created_by":"baidu","source":"official","description":"Qianfan-OCR-Fast is a domain-specific 
multimodal large model purpose-built for OCR.","release_date":"2026-04-20","context_window":65536,"max_output_tokens":28672,"tagline":"Qianfan-OCR-Fast is a domain-specific multimodal large model purpose-built for OCR.","capabilities":{"reasoning":true},"modalities":{"input":["image","text"],"output":["text"]},"pricing":{"input":0.68,"output":2.81},"last_updated":"2026-05-23","status":"deprecated","deprecation_date":"2026-05-28"},{"id":"bytedance-seed/seed-1.6-flash","name":"ByteDance Seed: Seed 1.6 Flash","created_by":"bytedance-seed","source":"official","last_updated":"2026-03-24","description":"Seed 1.6 Flash is an ultra-fast multimodal deep thinking model by ByteDance Seed, supporting both text and visual understanding.","context_window":262144,"max_output_tokens":32768,"modalities":{"input":["image","text","video"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":0.075,"output":0.3},"release_date":"2025-12-23","tagline":"Seed 1.6 Flash is an ultra-fast multimodal deep thinking model by ByteDance Seed, supporting both text and visual understanding.","tools":["function_calling"]},{"id":"bytedance-seed/seed-1.6","name":"ByteDance Seed: Seed 1.6","created_by":"bytedance-seed","source":"official","last_updated":"2026-03-24","description":"Seed 1.6 is a general-purpose model released by the ByteDance Seed team.","context_window":262144,"max_output_tokens":32768,"modalities":{"input":["image","text","video"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":0.25,"output":2},"release_date":"2025-12-23","tagline":"Seed 1.6 is a general-purpose model released by the ByteDance Seed team.","tools":["function_calling"]},{"id":"bytedance-seed/seed-2.0-lite","name":"ByteDance Seed: Seed-2.0-Lite","created_by":"bytedance-seed","source":"official","last_updated":"2026-04-07","description":"Seed-2.0-Lite is a 
versatile, cost‑efficient enterprise workhorse that delivers strong multimodal and agent capabilities while offering noticeably lower latency, making it a practical default choice f","context_window":262144,"max_output_tokens":131072,"modalities":{"input":["text","image","video"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":0.25,"output":2},"release_date":"2026-03-10","tagline":"Seed-2.0-Lite is a versatile, cost‑efficient enterprise workhorse that delivers strong multimodal and agent capabilities while offering noticeably lower latency, making it a practical default choice f","tools":["function_calling"]},{"id":"bytedance-seed/seed-2.0-mini","name":"ByteDance Seed: Seed-2.0-Mini","created_by":"bytedance-seed","source":"official","last_updated":"2026-03-24","description":"Seed-2.0-mini targets latency-sensitive, high-concurrency, and cost-sensitive scenarios, emphasizing fast response and flexible inference deployment.","context_window":262144,"max_output_tokens":131072,"modalities":{"input":["text","image","video"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":0.1,"output":0.4},"release_date":"2026-02-26","tagline":"Seed-2.0-mini targets latency-sensitive, high-concurrency, and cost-sensitive scenarios, emphasizing fast response and flexible inference deployment.","tools":["function_calling"]},{"id":"bytedance/ui-tars-1.5-7b","name":"ByteDance: UI-TARS 7B ","created_by":"bytedance","source":"official","last_updated":"2026-06-18","description":"UI-TARS-1.5 is a multimodal vision-language agent optimized for GUI-based environments, including desktop interfaces, web browsers, mobile systems, and 
games.","context_window":128000,"max_output_tokens":2048,"modalities":{"input":["image","text"],"output":["text"]},"pricing":{"input":0.1,"output":0.2,"cached_input":0.1},"parameters":7,"release_date":"2025-07-22","tagline":"UI-TARS-1.5 is a multimodal vision-language agent optimized for GUI-based environments, including desktop interfaces, web browsers, mobile systems, and games.","capabilities":{"structured_output":true,"json_mode":true}},{"id":"cognitivecomputations/dolphin-mistral-24b-venice-edition:free","name":"Venice: Uncensored (free)","created_by":"cognitivecomputations","source":"official","last_updated":"2026-03-24","description":"Venice Uncensored Dolphin Mistral 24B Venice Edition is a fine-tuned variant of Mistral-Small-24B-Instruct-2501, developed by dphn.ai in collaboration with Venice.ai.","context_window":32768,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"structured_output":true,"json_mode":true},"parameters":24,"release_date":"2025-07-09","tagline":"Venice Uncensored Dolphin Mistral 24B Venice Edition is a fine-tuned variant of Mistral-Small-24B-Instruct-2501, developed by dphn.ai in collaboration with Venice.ai."},{"id":"cohere/command-a","name":"Cohere: Command A","created_by":"cohere","source":"official","last_updated":"2026-03-24","description":"Command A is an open-weights 111B parameter model with a 256k context window focused on delivering great performance across agentic, multilingual, and coding use cases.","context_window":256000,"max_output_tokens":8192,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"structured_output":true,"json_mode":true},"pricing":{"input":2.5,"output":10},"family":"command-a","model_type":"chat","release_date":"2025-03-13","tagline":"Command A is an open-weights 111B parameter model with a 256k context window focused on delivering great performance across agentic, multilingual, and coding use cases."},{"id":"cohere/command-r-08-2024","name":"Cohere: Command R 
(08-2024)","created_by":"cohere","source":"official","last_updated":"2026-03-24","description":"command-r-08-2024 is an update of the [Command R](/models/cohere/command-r) with improved performance for multilingual retrieval-augmented generation (RAG) and tool use.","context_window":128000,"max_output_tokens":4000,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"fine_tuning":true},"pricing":{"input":0.15,"output":0.6},"family":"command-r","model_type":"chat","release_date":"2024-08-30","tagline":"command-r-08-2024 is an update of the [Command R](/models/cohere/command-r) with improved performance for multilingual retrieval-augmented generation (RAG) and tool use.","tools":["function_calling"],"license":"cc-by-nc-4.0","open_weight":true},{"id":"cohere/command-r-plus-08-2024","name":"Cohere: Command R+ (08-2024)","created_by":"cohere","source":"official","last_updated":"2026-04-07","description":"command-r-plus-08-2024 is an update of the [Command R+](/models/cohere/command-r-plus) with roughly 50% higher throughput and 25% lower latencies as compared to the previous Command R+ version, while ","context_window":128000,"max_output_tokens":4000,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"fine_tuning":true},"pricing":{"input":2.5,"output":10},"family":"command-r-plus","model_type":"chat","release_date":"2024-08-30","tagline":"command-r-plus-08-2024 is an update of the [Command R+](/models/cohere/command-r-plus) with roughly 50% higher throughput and 25% lower latencies as compared to the previous Command R+ version, while ","tools":["function_calling"],"license":"cc-by-nc-4.0","open_weight":true},{"id":"cohere/command-r7b-12-2024","name":"Cohere: Command R7B (12-2024)","created_by":"cohere","source":"official","last_updated":"2026-03-24","description":"Command R7B (12-2024) is a 
small, fast update of the Command R+ model, delivered in December 2024.","context_window":128000,"max_output_tokens":4000,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"structured_output":true,"json_mode":true,"streaming":true,"tool_call":true,"reasoning":true,"fine_tuning":true},"pricing":{"input":0.038,"output":0.15},"family":"command-r","model_type":"chat","release_date":"2024-12-14","tagline":"Command R7B (12-2024) is a small, fast update of the Command R+ model, delivered in December 2024.","license":"cc-by-nc-4.0","open_weight":true},{"id":"cohere/north-mini-code:free","name":"Cohere: North Mini Code (free)","created_by":"cohere","source":"official","description":"North Mini Code is Cohere's first agentic coding model and the debut of its North family.","release_date":"2026-06-17","context_window":256000,"max_output_tokens":64000,"tagline":"North Mini Code is Cohere's first agentic coding model and the debut of its North family.","capabilities":{"tool_call":true,"reasoning":true},"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-06-18"},{"id":"deepcogito/cogito-v2.1-671b","name":"Deep Cogito: Cogito v2.1 671B","created_by":"deepcogito","source":"official","last_updated":"2026-03-24","description":"Cogito v2.1 671B MoE represents one of the strongest open models globally, matching performance of frontier closed and open models.","context_window":128000,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":1.25,"output":1.25},"parameters":671,"release_date":"2025-11-13","tagline":"Cogito v2.1 671B MoE represents one of the strongest open models globally, matching performance of frontier closed and open models.","model_type":"chat"},{"id":"deepseek/deepseek-chat-v3-0324","name":"DeepSeek: DeepSeek V3 
0324","created_by":"deepseek","source":"official","last_updated":"2026-04-25","family":"deepseek-chat","description":"DeepSeek V3, a 685B-parameter, mixture-of-experts model, is the latest iteration of the flagship chat model family from the DeepSeek team.","context_window":163840,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":0.2,"output":0.77,"cached_input":0.135},"release_date":"2025-03-24","tagline":"DeepSeek V3, a 685B-parameter, mixture-of-experts model, is the latest iteration of the flagship chat model family from the DeepSeek team.","tools":["function_calling"],"model_type":"chat","max_output_tokens":16384},{"id":"deepseek/deepseek-chat-v3.1","name":"DeepSeek: DeepSeek V3.1","created_by":"deepseek","source":"official","last_updated":"2026-05-14","family":"deepseek-chat","description":"DeepSeek-V3.1 is a large hybrid reasoning model (671B parameters, 37B active) that supports both thinking and non-thinking modes via prompt templates.","context_window":163840,"max_output_tokens":32768,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":0.21,"output":0.79,"cached_input":0.13},"release_date":"2025-08-21","tagline":"DeepSeek-V3.1 is a large hybrid reasoning model (671B parameters, 37B active) that supports both thinking and non-thinking modes via prompt templates.","tools":["function_calling"],"model_type":"chat"},{"id":"deepseek/deepseek-chat","name":"DeepSeek: DeepSeek V3","created_by":"deepseek","source":"official","last_updated":"2026-06-02","family":"deepseek-chat","description":"DeepSeek-V3 is the latest model from the DeepSeek team, building upon the instruction following and coding abilities of the previous 
versions.","context_window":131072,"max_output_tokens":16000,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"fine_tuning":true},"pricing":{"input":0.2,"output":0.8},"release_date":"2024-12-26","tagline":"DeepSeek-V3 is the latest model from the DeepSeek team, building upon the instruction following and coding abilities of the previous versions.","tools":["function_calling"],"model_type":"chat","license":"mit","open_weight":true},{"id":"deepseek/deepseek-r1-0528","name":"DeepSeek: R1 0528","created_by":"deepseek","source":"official","last_updated":"2026-04-25","family":"deepseek-r1","description":"May 28th update to the [original DeepSeek R1](/deepseek/deepseek-r1) Performance on par with [OpenAI o1](/openai/o1), but open-sourced and with fully open reasoning tokens.","context_window":163840,"max_output_tokens":32768,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":0.5,"output":2.15,"cached_input":0.35},"model_type":"reasoning","release_date":"2025-05-28","tagline":"May 28th update to the [original DeepSeek R1](/deepseek/deepseek-r1) Performance on par with [OpenAI o1](/openai/o1), but open-sourced and with fully open reasoning tokens.","tools":["function_calling"]},{"id":"deepseek/deepseek-r1-distill-llama-70b","name":"DeepSeek: R1 Distill Llama 70B","created_by":"deepseek","source":"official","last_updated":"2026-06-18","family":"deepseek-r1","description":"DeepSeek R1 Distill Llama 70B is a distilled large language model based on [Llama-3.3-70B-Instruct](/meta-llama/llama-3.3-70b-instruct), using outputs from [DeepSeek 
R1](/deepseek/deepseek-r1).","context_window":128000,"max_output_tokens":8192,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":0.8,"output":0.8},"model_type":"reasoning","parameters":70,"release_date":"2025-01-23","tagline":"DeepSeek R1 Distill Llama 70B is a distilled large language model based on [Llama-3.3-70B-Instruct](/meta-llama/llama-3.3-70b-instruct), using outputs from [DeepSeek R1](/deepseek/deepseek-r1).","status":"deprecated","deprecation_date":"2026-06-11"},{"id":"deepseek/deepseek-r1-distill-qwen-32b","name":"DeepSeek: R1 Distill Qwen 32B","created_by":"deepseek","source":"official","last_updated":"2026-05-17","family":"deepseek-r1","description":"DeepSeek R1 Distill Qwen 32B is a distilled large language model based on [Qwen 2.5 32B](https://huggingface.co/Qwen/Qwen2.5-32B), using outputs from [DeepSeek R1](/deepseek/deepseek-r1).","context_window":128000,"max_output_tokens":32768,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":0.29,"output":0.29},"model_type":"reasoning","parameters":32,"release_date":"2025-01-29","tagline":"DeepSeek R1 Distill Qwen 32B is a distilled large language model based on [Qwen 2.5 32B](https://huggingface.co/Qwen/Qwen2.5-32B), using outputs from [DeepSeek R1](/deepseek/deepseek-r1)."},{"id":"deepseek/deepseek-r1","name":"DeepSeek: R1","created_by":"deepseek","source":"official","last_updated":"2026-05-17","family":"deepseek-r1","description":"DeepSeek R1 is here: Performance on par with [OpenAI o1](/openai/o1), but open-sourced and with fully open reasoning 
tokens.","context_window":163840,"max_output_tokens":16000,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"reasoning":true,"structured_output":true,"json_mode":true},"pricing":{"input":0.7,"output":2.5},"model_type":"reasoning","release_date":"2025-01-20","tagline":"DeepSeek R1 is here: Performance on par with [OpenAI o1](/openai/o1), but open-sourced and with fully open reasoning tokens.","tools":["function_calling"]},{"id":"deepseek/deepseek-v3.1-terminus","name":"DeepSeek: DeepSeek V3.1 Terminus","created_by":"deepseek","source":"official","last_updated":"2026-05-06","family":"deepseek","description":"DeepSeek-V3.1 Terminus is an update to [DeepSeek V3.1](/deepseek/deepseek-chat-v3.1) that maintains the model's original capabilities while addressing issues reported by users, including language cons","context_window":163840,"max_output_tokens":32768,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":0.27,"output":0.95,"cached_input":0.13},"release_date":"2025-09-22","tagline":"DeepSeek-V3.1 Terminus is an update to [DeepSeek V3.1](/deepseek/deepseek-chat-v3.1) that maintains the model's original capabilities while addressing issues reported by users, including language cons","tools":["function_calling"],"model_type":"chat"},{"id":"deepseek/deepseek-v3.2-exp","name":"DeepSeek: DeepSeek V3.2 Exp","created_by":"deepseek","source":"official","last_updated":"2026-03-24","family":"deepseek","description":"DeepSeek-V3.2-Exp is an experimental large language model released by DeepSeek as an intermediate step between V3.1 and future 
architectures.","context_window":163840,"max_output_tokens":65536,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":0.27,"output":0.41},"release_date":"2025-09-29","tagline":"DeepSeek-V3.2-Exp is an experimental large language model released by DeepSeek as an intermediate step between V3.1 and future architectures.","tools":["function_calling"],"model_type":"chat"},{"id":"deepseek/deepseek-v3.2-speciale","name":"DeepSeek: DeepSeek V3.2 Speciale","created_by":"deepseek","source":"official","last_updated":"2026-05-07","family":"deepseek","description":"DeepSeek-V3.2-Speciale is a high-compute variant of DeepSeek-V3.2 optimized for maximum reasoning and agentic performance.","context_window":163840,"max_output_tokens":163840,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":0.287,"output":0.431,"cached_input":0.058},"release_date":"2025-12-01","tagline":"DeepSeek-V3.2-Speciale is a high-compute variant of DeepSeek-V3.2 optimized for maximum reasoning and agentic performance.","model_type":"chat"},{"id":"deepseek/deepseek-v3.2","name":"DeepSeek: DeepSeek V3.2","created_by":"deepseek","source":"official","last_updated":"2026-06-29","family":"deepseek","description":"DeepSeek-V3.2 is a large language model designed to harmonize high computational efficiency with strong reasoning and agentic tool-use performance.","context_window":131072,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":0.229,"output":0.343,"cached_input":0.023},"release_date":"2025-12-01","tagline":"DeepSeek-V3.2 is a large language model designed to harmonize high computational efficiency with strong reasoning and agentic tool-use 
performance.","tools":["function_calling"],"model_type":"chat","max_output_tokens":64000},{"id":"deepseek/deepseek-v4-flash:free","name":"DeepSeek: DeepSeek V4 Flash (free)","created_by":"deepseek","source":"official","family":"deepseek","description":"DeepSeek V4 Flash is an efficiency-optimized Mixture-of-Experts model from DeepSeek with 284B total parameters and 13B activated parameters, supporting a 1M-token context window.","release_date":"2026-04-24","context_window":1048576,"max_output_tokens":384000,"model_type":"chat","tagline":"DeepSeek V4 Flash is an efficiency-optimized Mixture-of-Experts model from DeepSeek with 284B total parameters and 13B activated parameters, supporting a 1M-token context window.","capabilities":{"tool_call":true,"reasoning":true},"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-05-17"},{"id":"deepseek/deepseek-v4-flash","name":"DeepSeek: DeepSeek V4 Flash","created_by":"deepseek","source":"official","family":"deepseek","description":"DeepSeek V4 Flash is an efficiency-optimized Mixture-of-Experts model from DeepSeek with 284B total parameters and 13B activated parameters, supporting a 1M-token context window.","release_date":"2026-04-24","context_window":1048576,"max_output_tokens":65536,"model_type":"chat","tagline":"DeepSeek V4 Flash is an efficiency-optimized Mixture-of-Experts model from DeepSeek with 284B total parameters and 13B activated parameters, supporting a 1M-token context window.","capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.09,"output":0.18,"cached_input":0.02},"tools":["function_calling"],"last_updated":"2026-06-18","license":"mit","open_weight":true},{"id":"deepseek/deepseek-v4-pro","name":"DeepSeek: DeepSeek V4 Pro","created_by":"deepseek","source":"official","family":"deepseek","description":"DeepSeek V4 Pro 
is a large-scale Mixture-of-Experts model from DeepSeek with 1.6T total parameters and 49B activated parameters, supporting a 1M-token context window.","release_date":"2026-04-24","context_window":1048576,"max_output_tokens":384000,"model_type":"chat","tagline":"DeepSeek V4 Pro is a large-scale Mixture-of-Experts model from DeepSeek with 1.6T total parameters and 49B activated parameters, supporting a 1M-token context window.","capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.435,"output":0.87,"cached_input":0.004},"tools":["function_calling"],"last_updated":"2026-04-26","license":"mit","open_weight":true},{"id":"eleutherai/llemma_7b","name":"EleutherAI: Llemma 7b","created_by":"eleutherai","source":"official","last_updated":"2026-03-23","description":"Llemma 7B is a language model for mathematics.","context_window":4096,"max_output_tokens":4096,"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.8,"output":1.2},"parameters":7,"release_date":"2025-04-14","tagline":"Llemma 7B is a language model for mathematics."},{"id":"essentialai/rnj-1-instruct","name":"EssentialAI: Rnj 1 Instruct","created_by":"essentialai","source":"official","last_updated":"2026-03-24","description":"Rnj-1 is an 8B-parameter, dense, open-weight model family developed by Essential AI and trained from scratch with a focus on programming, math, and scientific reasoning.","context_window":32768,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true},"pricing":{"input":0.15,"output":0.15},"release_date":"2025-12-07","tagline":"Rnj-1 is an 8B-parameter, dense, open-weight model family developed by Essential AI and trained from scratch with a focus on programming, math, and scientific 
reasoning.","tools":["function_calling"],"model_type":"chat"},{"id":"google/gemini-2.0-flash-001","name":"Google: Gemini 2.0 Flash","created_by":"google","source":"official","last_updated":"2026-05-23","family":"gemini-2.0","description":"Gemini Flash 2.0 offers a significantly faster time to first token (TTFT) compared to [Gemini Flash 1.5](/google/gemini-flash-1.5), while maintaining quality on par with larger models like [Gemini Pro 1.5](/google/gemini-pro-1.5).","status":"deprecated","deprecation_date":"2026-06-01","context_window":1000000,"max_output_tokens":8192,"modalities":{"input":["text","image","audio","video"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"vision":true},"pricing":{"input":0.1,"output":0.4,"cached_input":0.025},"model_type":"chat","release_date":"2025-02-05","tagline":"Gemini Flash 2.0 offers a significantly faster time to first token (TTFT) compared to [Gemini Flash 1.5](/google/gemini-flash-1.5), while maintaining quality on par with larger models like [Gemini Pro","tools":["function_calling"],"license":"proprietary","open_weight":false},{"id":"google/gemini-2.0-flash-lite-001","name":"Google: Gemini 2.0 Flash Lite","created_by":"google","source":"official","last_updated":"2026-03-24","family":"gemini-2.0","description":"Gemini 2.0 Flash Lite offers a significantly faster time to first token (TTFT) compared to [Gemini Flash 1.5](/google/gemini-flash-1.5), while maintaining quality on par with larger models like [Gemin","status":"deprecated","deprecation_date":"2026-06-01","context_window":1048576,"max_output_tokens":8192,"modalities":{"input":["text","image","audio","video"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"vision":true},"pricing":{"input":0.075,"output":0.3},"model_type":"chat","release_date":"2025-02-25","tagline":"Gemini 2.0 Flash Lite offers a significantly faster time to first token (TTFT) 
compared to [Gemini Flash 1.5](/google/gemini-flash-1.5), while maintaining quality on par with larger models like [Gemin","tools":["function_calling"],"license":"proprietary","open_weight":false},{"id":"google/gemini-2.5-flash-image","name":"Google: Nano Banana (Gemini 2.5 Flash Image)","created_by":"google","source":"official","last_updated":"2026-06-29","family":"gemini-2.5","description":"Gemini 2.5 Flash Image, a.k.a.","context_window":32768,"max_output_tokens":32768,"modalities":{"input":["image","text"],"output":["image","text"]},"capabilities":{"structured_output":true,"json_mode":true,"streaming":true,"tool_call":true,"reasoning":true,"batch":true,"vision":true},"pricing":{"input":0.3,"output":2.5,"cached_input":0.03},"model_type":"chat","release_date":"2025-10-07","tagline":"Gemini 2.5 Flash Image, a.k.a.","knowledge_cutoff":"2025-06","license":"proprietary","open_weight":false},{"id":"google/gemini-2.5-flash-lite-preview-09-2025","name":"Google: Gemini 2.5 Flash Lite Preview 09-2025","created_by":"google","source":"official","last_updated":"2026-04-03","family":"gemini-2.5","description":"Gemini 2.5 Flash-Lite is a lightweight reasoning model in the Gemini 2.5 family, optimized for ultra-low latency and cost efficiency.","context_window":1048576,"max_output_tokens":65535,"modalities":{"input":["text","image","audio","video"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"batch":true,"vision":true},"pricing":{"input":0.1,"output":0.4,"cached_input":0.01},"model_type":"chat","release_date":"2025-09-25","tagline":"Gemini 2.5 Flash-Lite is a lightweight reasoning model in the Gemini 2.5 family, optimized for ultra-low latency and cost efficiency.","tools":["function_calling"],"knowledge_cutoff":"2025-01","license":"proprietary","open_weight":false},{"id":"google/gemini-2.5-flash-lite","name":"Google: Gemini 2.5 Flash 
Lite","created_by":"google","source":"official","last_updated":"2026-03-24","family":"gemini-2.5","description":"Gemini 2.5 Flash-Lite is a lightweight reasoning model in the Gemini 2.5 family, optimized for ultra-low latency and cost efficiency.","context_window":1048576,"max_output_tokens":65535,"modalities":{"input":["text","image","audio","video"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"batch":true,"vision":true},"pricing":{"input":0.1,"output":0.4,"cached_input":0.01},"model_type":"chat","release_date":"2025-07-22","tagline":"Gemini 2.5 Flash-Lite is a lightweight reasoning model in the Gemini 2.5 family, optimized for ultra-low latency and cost efficiency.","tools":["function_calling"],"knowledge_cutoff":"2025-01","license":"proprietary","open_weight":false},{"id":"google/gemini-2.5-flash","name":"Google: Gemini 2.5 Flash","created_by":"google","source":"official","last_updated":"2026-03-24","family":"gemini-2.5","description":"Gemini 2.5 Flash is Google's state-of-the-art workhorse model, specifically designed for advanced reasoning, coding, mathematics, and scientific tasks.","context_window":1048576,"max_output_tokens":65535,"modalities":{"input":["image","text","audio","video"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"batch":true,"vision":true},"pricing":{"input":0.3,"output":2.5,"cached_input":0.03},"model_type":"chat","release_date":"2025-06-17","tagline":"Gemini 2.5 Flash is Google's state-of-the-art workhorse model, specifically designed for advanced reasoning, coding, mathematics, and scientific tasks.","tools":["function_calling"],"knowledge_cutoff":"2025-01","license":"proprietary","open_weight":false},{"id":"google/gemini-2.5-pro-preview-05-06","name":"Google: Gemini 2.5 Pro Preview 
05-06","created_by":"google","source":"official","last_updated":"2026-03-24","family":"gemini-2.5","description":"Gemini 2.5 Pro is Google’s state-of-the-art AI model designed for advanced reasoning, coding, mathematics, and scientific tasks.","context_window":1048576,"max_output_tokens":65535,"modalities":{"input":["text","image","audio","video"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"vision":true},"pricing":{"input":1.25,"output":10,"cached_input":0.125},"model_type":"chat","release_date":"2025-05-07","tagline":"Gemini 2.5 Pro is Google’s state-of-the-art AI model designed for advanced reasoning, coding, mathematics, and scientific tasks.","tools":["function_calling"],"license":"proprietary","open_weight":false},{"id":"google/gemini-2.5-pro-preview","name":"Google: Gemini 2.5 Pro Preview 06-05","created_by":"google","source":"official","last_updated":"2026-03-24","family":"gemini-2.5","description":"Gemini 2.5 Pro is Google’s state-of-the-art AI model designed for advanced reasoning, coding, mathematics, and scientific tasks.","context_window":1048576,"max_output_tokens":65536,"modalities":{"input":["image","text","audio"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":1.25,"output":10,"cached_input":0.125},"model_type":"chat","release_date":"2025-06-05","tagline":"Gemini 2.5 Pro is Google’s state-of-the-art AI model designed for advanced reasoning, coding, mathematics, and scientific tasks.","tools":["function_calling"]},{"id":"google/gemini-2.5-pro","name":"Google: Gemini 2.5 Pro","created_by":"google","source":"official","last_updated":"2026-03-24","family":"gemini-2.5","description":"Gemini 2.5 Pro is Google’s state-of-the-art AI model designed for advanced reasoning, coding, mathematics, and scientific 
tasks.","context_window":1048576,"max_output_tokens":65536,"modalities":{"input":["text","image","audio","video"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"batch":true,"vision":true},"pricing":{"input":1.25,"output":10,"cached_input":0.125},"model_type":"chat","release_date":"2025-06-17","tagline":"Gemini 2.5 Pro is Google’s state-of-the-art AI model designed for advanced reasoning, coding, mathematics, and scientific tasks.","tools":["function_calling"],"knowledge_cutoff":"2025-01","license":"proprietary","open_weight":false},{"id":"google/gemini-3-flash-preview","name":"Google: Gemini 3 Flash Preview","created_by":"google","source":"official","last_updated":"2026-06-18","family":"gemini-3","description":"Gemini 3 Flash Preview is a high speed, high value thinking model designed for agentic workflows, multi turn chat, and coding assistance.","context_window":1048576,"max_output_tokens":65535,"modalities":{"input":["text","image","audio","video"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"batch":true,"vision":true},"pricing":{"input":0.5,"output":3,"cached_input":0.05},"model_type":"chat","release_date":"2025-12-17","tagline":"Gemini 3 Flash Preview is a high speed, high value thinking model designed for agentic workflows, multi turn chat, and coding assistance.","tools":["function_calling"],"knowledge_cutoff":"2025-01","license":"proprietary","open_weight":false},{"id":"google/gemini-3-pro-image-preview","name":"Google: Nano Banana Pro (Gemini 3 Pro Image Preview)","created_by":"google","source":"official","last_updated":"2026-03-24","family":"gemini-3","description":"Nano Banana Pro is Google’s most advanced image-generation and editing model, built on Gemini 3 
Pro.","context_window":65536,"max_output_tokens":32768,"modalities":{"input":["image","text"],"output":["image","text"]},"capabilities":{"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"tool_call":true,"batch":true,"vision":true},"pricing":{"input":2,"output":12,"cached_input":0.2},"model_type":"chat","release_date":"2025-11-20","tagline":"Nano Banana Pro is Google’s most advanced image-generation and editing model, built on Gemini 3 Pro.","knowledge_cutoff":"2025-01","license":"proprietary","open_weight":false},{"id":"google/gemini-3-pro-image","name":"Google: Nano Banana Pro (Gemini 3 Pro Image)","created_by":"google","source":"official","family":"gemini-3","description":"Nano Banana Pro is Google’s most advanced image-generation and editing model, built on Gemini 3 Pro.","release_date":"2026-06-18","context_window":65536,"max_output_tokens":32768,"model_type":"chat","tagline":"Nano Banana Pro is Google’s most advanced image-generation and editing model, built on Gemini 3 Pro.","capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"batch":true,"vision":true},"modalities":{"input":["image","text"],"output":["image","text"]},"pricing":{"input":2,"output":12,"cached_input":0.2},"tools":["function_calling"],"last_updated":"2026-06-18","knowledge_cutoff":"2025-01","license":"proprietary","open_weight":false},{"id":"google/gemini-3-pro-preview","name":"Google: Gemini 3 Pro Preview","created_by":"google","source":"official","last_updated":"2026-03-24","family":"gemini-3","description":"Gemini 3 Pro is Google’s flagship frontier model for high-precision multimodal reasoning, combining strong performance across text, image, video, audio, and code with a 1M-token context 
window.","status":"deprecated","deprecation_date":"2026-03-26","context_window":1048576,"max_output_tokens":65536,"modalities":{"input":["text","image","audio","video"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"batch":true,"vision":true},"pricing":{"input":2,"output":12,"cached_input":0.2},"model_type":"chat","release_date":"2025-11-18","tagline":"Gemini 3 Pro is Google’s flagship frontier model for high-precision multimodal reasoning, combining strong performance across text, image, video, audio, and code with a 1M-token context window.","tools":["function_calling"],"knowledge_cutoff":"2025-01","license":"proprietary","open_weight":false},{"id":"google/gemini-3.1-flash-image-preview","name":"Google: Nano Banana 2 (Gemini 3.1 Flash Image Preview)","created_by":"google","source":"official","last_updated":"2026-06-29","family":"gemini-3.1","description":"Gemini 3.1 Flash Image Preview, a.k.a.","context_window":131072,"max_output_tokens":32768,"modalities":{"input":["image","text"],"output":["image","text"]},"capabilities":{"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"tool_call":true,"batch":true,"vision":true},"pricing":{"input":0.5,"output":3},"model_type":"chat","release_date":"2026-02-26","tagline":"Gemini 3.1 Flash Image Preview, a.k.a.","knowledge_cutoff":"2025-01","license":"proprietary","open_weight":false},{"id":"google/gemini-3.1-flash-image","name":"Google: Nano Banana 2 (Gemini 3.1 Flash Image)","created_by":"google","source":"official","family":"gemini-3.1","description":"Gemini 3.1 Flash Image, a.k.a.","release_date":"2026-06-18","context_window":131072,"max_output_tokens":32768,"model_type":"chat","tagline":"Gemini 3.1 Flash Image, 
a.k.a.","capabilities":{"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"tool_call":true,"batch":true,"vision":true},"modalities":{"input":["image","text"],"output":["image","text"]},"pricing":{"input":0.5,"output":3},"last_updated":"2026-06-29","knowledge_cutoff":"2025-01","license":"proprietary","open_weight":false},{"id":"google/gemini-3.1-flash-lite-preview","name":"Google: Gemini 3.1 Flash Lite Preview","created_by":"google","source":"official","last_updated":"2026-03-24","family":"gemini-3.1","description":"Gemini 3.1 Flash Lite Preview is Google's high-efficiency model optimized for high-volume use cases.","context_window":1048576,"max_output_tokens":65536,"modalities":{"input":["text","image","video","audio"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"batch":true,"vision":true},"pricing":{"input":0.25,"output":1.5,"cached_input":0.025},"model_type":"chat","release_date":"2026-03-03","tagline":"Gemini 3.1 Flash Lite Preview is Google's high-efficiency model optimized for high-volume use cases.","tools":["function_calling"],"knowledge_cutoff":"2025-01","license":"proprietary","open_weight":false},{"id":"google/gemini-3.1-flash-lite","name":"Google: Gemini 3.1 Flash Lite","created_by":"google","source":"official","family":"gemini-3.1","description":"Gemini 3.1 Flash Lite is Google’s GA high-efficiency multimodal model optimized for low-latency, high-volume workloads.","release_date":"2026-05-07","context_window":1048576,"max_output_tokens":65536,"model_type":"chat","tagline":"Gemini 3.1 Flash Lite is Google’s GA high-efficiency multimodal model optimized for low-latency, high-volume 
workloads.","capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"batch":true,"vision":true},"modalities":{"input":["text","image","video","audio"],"output":["text"]},"pricing":{"input":0.25,"output":1.5,"cached_input":0.025},"tools":["function_calling"],"last_updated":"2026-05-10","knowledge_cutoff":"2025-01","license":"proprietary","open_weight":false},{"id":"google/gemini-3.1-pro-preview-customtools","name":"Google: Gemini 3.1 Pro Preview Custom Tools","created_by":"google","source":"official","last_updated":"2026-05-17","family":"gemini-3.1","description":"Gemini 3.1 Pro Preview Custom Tools is a variant of Gemini 3.1 Pro that improves tool selection behavior by preventing overuse of a general bash tool when more efficient third-party...","context_window":1048756,"max_output_tokens":65536,"modalities":{"input":["text","audio","image","video"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":2,"output":12,"cached_input":0.2},"model_type":"chat","release_date":"2026-02-25","tagline":"Gemini 3.1 Pro Preview Custom Tools is a variant of Gemini 3.1 Pro that improves tool selection behavior by preventing overuse of a general bash tool when more efficient third-party or user-defined fu","tools":["function_calling"]},{"id":"google/gemini-3.1-pro-preview","name":"Google: Gemini 3.1 Pro Preview","created_by":"google","source":"official","last_updated":"2026-03-24","family":"gemini-3.1","description":"Gemini 3.1 Pro Preview is Google’s frontier reasoning model, delivering enhanced software engineering performance, improved agentic reliability, and more efficient token usage across complex 
workflows.","context_window":1048576,"max_output_tokens":65536,"modalities":{"input":["audio","image","text","video"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"batch":true,"vision":true},"pricing":{"input":2,"output":12,"cached_input":0.2},"model_type":"chat","release_date":"2026-02-19","tagline":"Gemini 3.1 Pro Preview is Google’s frontier reasoning model, delivering enhanced software engineering performance, improved agentic reliability, and more efficient token usage across complex workflows","tools":["function_calling"],"knowledge_cutoff":"2025-01","license":"proprietary","open_weight":false},{"id":"google/gemini-3.5-flash","name":"Google: Gemini 3.5 Flash","created_by":"google","source":"official","family":"gemini-3.5","description":"Gemini 3.5 Flash is Google's high-efficiency multimodal model, bringing near-Pro level coding and reasoning at Flash-tier cost and speed.","release_date":"2026-05-19","context_window":1048576,"max_output_tokens":65536,"model_type":"chat","tagline":"Gemini 3.5 Flash is Google's high-efficiency multimodal model, bringing near-Pro level coding and reasoning at Flash-tier cost and speed.","capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"batch":true,"vision":true},"modalities":{"input":["text","image","video","audio"],"output":["text"]},"pricing":{"input":1.5,"output":9,"cached_input":0.15},"tools":["function_calling"],"last_updated":"2026-05-23","knowledge_cutoff":"2025-01","license":"proprietary","open_weight":false},{"id":"google/gemma-2-27b-it","name":"Google: Gemma 2 27B","created_by":"google","source":"official","last_updated":"2026-03-24","family":"gemma-2","description":"Gemma 2 27B by Google is an open model built from the same research and technology used to create the [Gemini 
models](/models?q=gemini).","context_window":8192,"max_output_tokens":2048,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"structured_output":true,"json_mode":true},"pricing":{"input":0.65,"output":0.65},"model_type":"chat","parameters":27,"release_date":"2024-07-13","tagline":"Gemma 2 27B by Google is an open model built from the same research and technology used to create the [Gemini models](/models?q=gemini)."},{"id":"google/gemma-2-9b-it","name":"Google: Gemma 2 9B","created_by":"google","source":"official","last_updated":"2026-03-23","family":"gemma-2","description":"Gemma 2 9B by Google is an advanced, open-source language model that sets a new standard for efficiency and performance in its size class.","context_window":8192,"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.03,"output":0.09},"model_type":"chat","parameters":9,"release_date":"2024-06-28","tagline":"Gemma 2 9B by Google is an advanced, open-source language model that sets a new standard for efficiency and performance in its size class."},{"id":"google/gemma-3-12b-it:free","name":"Google: Gemma 3 12B (free)","created_by":"google","source":"official","last_updated":"2026-03-23","family":"gemma-3","description":"Gemma 3 introduces multimodality, supporting vision-language input and text outputs.","context_window":32768,"max_output_tokens":8192,"modalities":{"input":["text","image"],"output":["text"]},"model_type":"chat","parameters":12,"release_date":"2025-03-13","tagline":"Gemma 3 introduces multimodality, supporting vision-language input and text outputs."},{"id":"google/gemma-3-12b-it","name":"Google: Gemma 3 12B","created_by":"google","source":"official","last_updated":"2026-06-10","family":"gemma-3","description":"Gemma 3 introduces multimodality, supporting vision-language input and text 
outputs.","context_window":131072,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"structured_output":true,"json_mode":true,"tool_call":true},"pricing":{"input":0.05,"output":0.15},"model_type":"chat","parameters":12,"release_date":"2025-03-13","tagline":"Gemma 3 introduces multimodality, supporting vision-language input and text outputs.","max_output_tokens":16384,"tools":["function_calling"]},{"id":"google/gemma-3-27b-it:free","name":"Google: Gemma 3 27B (free)","created_by":"google","source":"official","last_updated":"2026-03-24","family":"gemma-3","description":"Gemma 3 introduces multimodality, supporting vision-language input and text outputs.","context_window":131072,"max_output_tokens":8192,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"structured_output":true,"json_mode":true},"model_type":"chat","parameters":27,"release_date":"2025-03-12","tagline":"Gemma 3 introduces multimodality, supporting vision-language input and text outputs."},{"id":"google/gemma-3-27b-it","name":"Google: Gemma 3 27B","created_by":"google","source":"official","last_updated":"2026-04-25","family":"gemma-3","description":"Gemma 3 introduces multimodality, supporting vision-language input and text outputs.","context_window":131072,"max_output_tokens":16384,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"structured_output":true,"json_mode":true,"tool_call":true},"pricing":{"input":0.08,"output":0.16},"model_type":"chat","parameters":27,"release_date":"2025-03-12","tagline":"Gemma 3 introduces multimodality, supporting vision-language input and text outputs.","tools":["function_calling"]},{"id":"google/gemma-3-4b-it:free","name":"Google: Gemma 3 4B (free)","created_by":"google","source":"official","last_updated":"2026-03-24","family":"gemma-3","description":"Gemma 3 introduces multimodality, supporting vision-language input and text 
outputs.","context_window":32768,"max_output_tokens":8192,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"structured_output":true,"json_mode":true},"model_type":"chat","parameters":4,"release_date":"2025-03-13","tagline":"Gemma 3 introduces multimodality, supporting vision-language input and text outputs."},{"id":"google/gemma-3-4b-it","name":"Google: Gemma 3 4B","created_by":"google","source":"official","last_updated":"2026-06-10","family":"gemma-3","description":"Gemma 3 introduces multimodality, supporting vision-language input and text outputs.","context_window":131072,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"structured_output":true,"json_mode":true},"pricing":{"input":0.05,"output":0.1},"model_type":"chat","parameters":4,"release_date":"2025-03-13","tagline":"Gemma 3 introduces multimodality, supporting vision-language input and text outputs.","max_output_tokens":16384},{"id":"google/gemma-3n-e2b-it:free","name":"Google: Gemma 3n 2B (free)","created_by":"google","source":"official","last_updated":"2026-03-24","family":"gemma-3n","description":"Gemma 3n E2B IT is a multimodal, instruction-tuned model developed by Google DeepMind, designed to operate efficiently at an effective parameter size of 2B while leveraging a 6B architecture.","context_window":8192,"max_output_tokens":2048,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"structured_output":true,"json_mode":true},"model_type":"chat","release_date":"2025-07-09","tagline":"Gemma 3n E2B IT is a multimodal, instruction-tuned model developed by Google DeepMind, designed to operate efficiently at an effective parameter size of 2B while leveraging a 6B architecture."},{"id":"google/gemma-3n-e4b-it:free","name":"Google: Gemma 3n 4B (free)","created_by":"google","source":"official","last_updated":"2026-03-24","family":"gemma-3n","description":"Gemma 3n E4B-it is optimized for efficient execution on mobile and low-resource devices, such 
as phones, laptops, and tablets.","context_window":8192,"max_output_tokens":2048,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"structured_output":true,"json_mode":true},"model_type":"chat","release_date":"2025-05-20","tagline":"Gemma 3n E4B-it is optimized for efficient execution on mobile and low-resource devices, such as phones, laptops, and tablets."},{"id":"google/gemma-3n-e4b-it","name":"Google: Gemma 3n 4B","created_by":"google","source":"official","last_updated":"2026-06-18","family":"gemma-3n","description":"Gemma 3n E4B-it is optimized for efficient execution on mobile and low-resource devices, such as phones, laptops, and tablets.","context_window":32768,"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.06,"output":0.12},"model_type":"chat","release_date":"2025-05-20","tagline":"Gemma 3n E4B-it is optimized for efficient execution on mobile and low-resource devices, such as phones, laptops, and tablets.","capabilities":{"structured_output":true,"json_mode":true}},{"id":"google/gemma-4-26b-a4b-it:free","name":"Google: Gemma 4 26B A4B (free)","created_by":"google","source":"official","family":"gemma-4","description":"Gemma 4 26B A4B IT is an instruction-tuned Mixture-of-Experts (MoE) model from Google DeepMind.","release_date":"2026-04-03","context_window":262144,"max_output_tokens":32768,"parameters":26,"active_parameters":4,"model_type":"chat","tagline":"Gemma 4 26B A4B IT is an instruction-tuned Mixture-of-Experts (MoE) model from Google DeepMind.","capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"modalities":{"input":["image","text","video"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-04-08"},{"id":"google/gemma-4-26b-a4b-it","name":"Google: Gemma 4 26B A4B ","created_by":"google","source":"official","family":"gemma-4","description":"Gemma 4 26B A4B IT is an instruction-tuned Mixture-of-Experts (MoE) model from Google 
DeepMind.","release_date":"2026-04-03","context_window":262144,"max_output_tokens":16384,"parameters":26,"active_parameters":4,"model_type":"chat","tagline":"Gemma 4 26B A4B IT is an instruction-tuned Mixture-of-Experts (MoE) model from Google DeepMind.","capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"modalities":{"input":["image","text","video"],"output":["text"]},"pricing":{"input":0.06,"output":0.33,"cached_input":0.04},"tools":["function_calling"],"last_updated":"2026-05-23"},{"id":"google/gemma-4-31b-it:free","name":"Google: Gemma 4 31B (free)","created_by":"google","source":"official","family":"gemma-4","description":"Gemma 4 31B Instruct is Google DeepMind's 30.7B dense multimodal model supporting text and image input with text output.","release_date":"2026-04-02","context_window":262144,"max_output_tokens":8192,"parameters":31,"model_type":"chat","tagline":"Gemma 4 31B Instruct is Google DeepMind's 30.7B dense multimodal model supporting text and image input with text output.","capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"modalities":{"input":["image","text","video"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-06-18"},{"id":"google/gemma-4-31b-it","name":"Google: Gemma 4 31B","created_by":"google","source":"official","family":"gemma-4","description":"Gemma 4 31B Instruct is Google DeepMind's 30.7B dense multimodal model supporting text and image input with text output.","release_date":"2026-04-02","context_window":262144,"max_output_tokens":262144,"parameters":31,"model_type":"chat","tagline":"Gemma 4 31B Instruct is Google DeepMind's 30.7B dense multimodal model supporting text and image input with text 
output.","capabilities":{"structured_output":true,"reasoning":true,"json_mode":true,"tool_call":true},"modalities":{"input":["image","text","video"],"output":["text"]},"pricing":{"input":0.12,"output":0.35,"cached_input":0.09},"last_updated":"2026-06-18","tools":["function_calling"]},{"id":"google/lyria-3-clip-preview","name":"Google: Lyria 3 Clip Preview","created_by":"google","source":"official","description":"30 second duration clips are priced at $0.04 per clip.","release_date":"2026-03-30","context_window":1048576,"max_output_tokens":65536,"model_type":"tts","tagline":"30 second duration clips are priced at $0.04 per clip.","capabilities":{"structured_output":true,"json_mode":true,"streaming":true,"tool_call":true,"reasoning":true,"batch":true,"vision":true},"modalities":{"input":["text","image"],"output":["text","audio"]},"last_updated":"2026-04-01","license":"proprietary","open_weight":false},{"id":"google/lyria-3-pro-preview","name":"Google: Lyria 3 Pro Preview","created_by":"google","source":"official","description":"Full-length songs are priced at $0.08 per song.","release_date":"2026-03-30","context_window":1048576,"max_output_tokens":65536,"model_type":"tts","tagline":"Full-length songs are priced at $0.08 per song.","capabilities":{"structured_output":true,"json_mode":true,"streaming":true,"tool_call":true,"reasoning":true,"batch":true,"vision":true},"modalities":{"input":["text","image"],"output":["text","audio"]},"last_updated":"2026-04-01","license":"proprietary","open_weight":false},{"id":"gryphe/mythomax-l2-13b","name":"MythoMax 13B","created_by":"gryphe","source":"official","last_updated":"2026-03-24","description":"One of the highest performing and most popular fine-tunes of Llama 2 13B, with rich descriptions and 
roleplay.","context_window":4096,"max_output_tokens":4096,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"structured_output":true,"json_mode":true},"pricing":{"input":0.06,"output":0.06},"parameters":13,"release_date":"2023-07-02","tagline":"One of the highest performing and most popular fine-tunes of Llama 2 13B, with rich descriptions and roleplay."},{"id":"ibm-granite/granite-4.0-h-micro","name":"IBM: Granite 4.0 Micro","created_by":"ibm-granite","source":"official","last_updated":"2026-06-18","description":"Granite-4.0-H-Micro is a 3B parameter from the Granite 4 family of models.","context_window":131000,"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.017,"output":0.112},"release_date":"2025-10-20","tagline":"Granite-4.0-H-Micro is a 3B parameter from the Granite 4 family of models.","model_type":"chat","max_output_tokens":131000,"capabilities":{"structured_output":true,"json_mode":true}},{"id":"ibm-granite/granite-4.1-8b","name":"IBM: Granite 4.1 8B","created_by":"ibm-granite","source":"official","description":"Granite 4.1 8B is a dense, decoder-only 8-billion-parameter language model from IBM, part of the Granite 4.1 family.","release_date":"2026-04-30","context_window":131072,"max_output_tokens":131072,"parameters":8,"model_type":"chat","tagline":"Granite 4.1 8B is a dense, decoder-only 8-billion-parameter language model from IBM, part of the Granite 4.1 family.","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.05,"output":0.1,"cached_input":0.05},"tools":["function_calling"],"last_updated":"2026-05-01"},{"id":"inception/mercury-2","name":"Inception: Mercury 2","created_by":"inception","source":"official","last_updated":"2026-03-24","description":"Mercury 2 is an extremely fast reasoning LLM, and the first reasoning diffusion LLM 
(dLLM).","context_window":128000,"max_output_tokens":50000,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true},"pricing":{"input":0.25,"output":0.75,"cached_input":0.025},"release_date":"2026-03-04","tagline":"Mercury 2 is an extremely fast reasoning LLM, and the first reasoning diffusion LLM (dLLM).","tools":["function_calling"],"license":"proprietary","open_weight":false},{"id":"inception/mercury-coder","name":"Inception: Mercury Coder","created_by":"inception","source":"official","last_updated":"2026-04-03","description":"Mercury Coder is the first diffusion large language model (dLLM).","context_window":128000,"max_output_tokens":32000,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true},"pricing":{"input":0.25,"output":0.75,"cached_input":0.025},"release_date":"2025-04-30","tagline":"Mercury Coder is the first diffusion large language model (dLLM).","tools":["function_calling"],"status":"deprecated","deprecation_date":"2026-04-15","license":"proprietary","open_weight":false},{"id":"inception/mercury","name":"Inception: Mercury","created_by":"inception","source":"official","last_updated":"2026-03-24","description":"Mercury is the first diffusion large language model (dLLM).","status":"deprecated","deprecation_date":"2026-04-15","context_window":128000,"max_output_tokens":32000,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true},"pricing":{"input":0.25,"output":0.75,"cached_input":0.025},"release_date":"2025-06-26","tagline":"Mercury is the first diffusion large language model (dLLM).","tools":["function_calling"],"license":"proprietary","open_weight":false},{"id":"inclusionai/ling-2.6-1t:free","name":"inclusionAI: Ling-2.6-1T 
(free)","created_by":"inclusionai","source":"official","description":"Ling-2.6-1T is an instant (instruct) model from inclusionAI and the company’s trillion-parameter flagship, designed for real-world agents that require fast execution and high efficiency at scale.","status":"deprecated","release_date":"2026-04-23","deprecation_date":"2026-05-07","context_window":262144,"max_output_tokens":32768,"tagline":"Ling-2.6-1T is an instant (instruct) model from inclusionAI and the company’s trillion-parameter flagship, designed for real-world agents that require fast execution and high efficiency at scale.","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true},"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-05-01"},{"id":"inclusionai/ling-2.6-1t","name":"inclusionAI: Ling-2.6-1T","created_by":"inclusionai","source":"official","description":"Ling-2.6-1T is an instant (instruct) model from inclusionAI and the company’s trillion-parameter flagship, designed for real-world agents that require fast execution and high efficiency at scale.","release_date":"2026-04-23","context_window":262144,"max_output_tokens":32768,"tagline":"Ling-2.6-1T is an instant (instruct) model from inclusionAI and the company’s trillion-parameter flagship, designed for real-world agents that require fast execution and high efficiency at scale.","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.075,"output":0.625,"cached_input":0.015},"tools":["function_calling"],"last_updated":"2026-05-23"},{"id":"inclusionai/ling-2.6-flash:free","name":"inclusionAI: Ling-2.6-flash (free)","created_by":"inclusionai","source":"official","description":"Ling-2.6-flash is an instant (instruct) model from inclusionAI with 104B total parameters and 7.4B active parameters, designed for real-world agents that require fast responses, strong execution, and 
","release_date":"2026-04-21","context_window":262144,"max_output_tokens":32768,"tagline":"Ling-2.6-flash is an instant (instruct) model from inclusionAI with 104B total parameters and 7.4B active parameters, designed for real-world agents that require fast responses, strong execution, and ","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true},"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-04-24","status":"deprecated","deprecation_date":"2026-04-29"},{"id":"inclusionai/ling-2.6-flash","name":"inclusionAI: Ling-2.6-flash","created_by":"inclusionai","source":"official","description":"Ling-2.6-flash is an instant (instruct) model from inclusionAI with 104B total parameters and 7.4B active parameters, designed for real-world agents that require fast responses, strong execution, and ","release_date":"2026-04-21","context_window":262144,"max_output_tokens":32768,"tagline":"Ling-2.6-flash is an instant (instruct) model from inclusionAI with 104B total parameters and 7.4B active parameters, designed for real-world agents that require fast responses, strong execution, and ","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.01,"output":0.03,"cached_input":0.002},"tools":["function_calling"],"last_updated":"2026-05-17"},{"id":"inclusionai/ring-2.6-1t:free","name":"inclusionAI: Ring-2.6-1T (free)","created_by":"inclusionai","source":"official","description":"Ring-2.6-1T is a 1T-parameter-scale thinking model with 63B active parameters, built for real-world agent workflows that require both strong capability and operational efficiency.","release_date":"2026-05-08","context_window":262144,"max_output_tokens":65536,"tagline":"Ring-2.6-1T is a 1T-parameter-scale thinking model with 63B active parameters, built for real-world agent workflows that require both strong capability and operational 
efficiency.","capabilities":{"tool_call":true,"reasoning":true},"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-05-10"},{"id":"inclusionai/ring-2.6-1t","name":"inclusionAI: Ring-2.6-1T","created_by":"inclusionai","source":"official","description":"Ring-2.6-1T is a 1T-parameter-scale thinking model with 63B active parameters, built for real-world agent workflows that require both strong capability and operational efficiency.","release_date":"2026-05-08","context_window":262144,"max_output_tokens":65536,"tagline":"Ring-2.6-1T is a 1T-parameter-scale thinking model with 63B active parameters, built for real-world agent workflows that require both strong capability and operational efficiency.","capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.075,"output":0.625,"cached_input":0.015},"tools":["function_calling"],"last_updated":"2026-06-03"},{"id":"inflection/inflection-3-pi","name":"Inflection: Inflection 3 Pi","created_by":"inflection","source":"official","last_updated":"2026-03-23","description":"Inflection 3 Pi powers Inflection's [Pi](https://pi.ai) chatbot, including backstory, emotional intelligence, productivity, and safety.","context_window":8000,"max_output_tokens":1024,"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":2.5,"output":10},"release_date":"2024-10-11","tagline":"Inflection 3 Pi powers Inflection's [Pi](https://pi.ai) chatbot, including backstory, emotional intelligence, productivity, and safety."},{"id":"inflection/inflection-3-productivity","name":"Inflection: Inflection 3 Productivity","created_by":"inflection","source":"official","last_updated":"2026-03-23","description":"Inflection 3 Productivity is optimized for following 
instructions.","context_window":8000,"max_output_tokens":1024,"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":2.5,"output":10},"release_date":"2024-10-11","tagline":"Inflection 3 Productivity is optimized for following instructions."},{"id":"kwaipilot/kat-coder-pro-v2","name":"Kwaipilot: KAT-Coder-Pro V2","created_by":"kwaipilot","source":"official","description":"KAT-Coder-Pro V2 is the latest high-performance model in KwaiKAT’s KAT-Coder series, designed for complex enterprise-grade software engineering and SaaS integration.","release_date":"2026-03-27","context_window":256000,"max_output_tokens":80000,"tagline":"KAT-Coder-Pro V2 is the latest high-performance model in KwaiKAT’s KAT-Coder series, designed for complex enterprise-grade software engineering and SaaS integration.","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.3,"output":1.2,"cached_input":0.06},"tools":["function_calling"],"last_updated":"2026-04-01"},{"id":"kwaipilot/kat-coder-pro","name":"Kwaipilot: KAT-Coder-Pro V1","created_by":"kwaipilot","source":"official","last_updated":"2026-03-24","description":"KAT-Coder-Pro V1 is KwaiKAT's most advanced agentic coding model in the KAT-Coder series.","context_window":256000,"max_output_tokens":128000,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true},"pricing":{"input":0.207,"output":0.828,"cached_input":0.041},"release_date":"2025-11-10","tagline":"KAT-Coder-Pro V1 is KwaiKAT's most advanced agentic coding model in the KAT-Coder series.","tools":["function_calling"]},{"id":"liquid/lfm-2-24b-a2b","name":"LiquidAI: LFM2-24B-A2B","created_by":"liquid","source":"official","last_updated":"2026-06-18","description":"LFM2-24B-A2B is the largest model in the LFM2 family of hybrid architectures designed for efficient on-device 
deployment.","context_window":128000,"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.03,"output":0.12},"parameters":24,"active_parameters":2,"release_date":"2026-02-25","tagline":"LFM2-24B-A2B is the largest model in the LFM2 family of hybrid architectures designed for efficient on-device deployment.","model_type":"chat","capabilities":{"structured_output":true,"json_mode":true}},{"id":"liquid/lfm-2.2-6b","name":"LiquidAI: LFM2-2.6B","created_by":"liquid","source":"official","last_updated":"2026-03-23","description":"LFM2 is a new generation of hybrid models developed by Liquid AI, specifically designed for edge AI and on-device deployment.","context_window":32768,"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.01,"output":0.02},"parameters":6,"release_date":"2025-10-20","tagline":"LFM2 is a new generation of hybrid models developed by Liquid AI, specifically designed for edge AI and on-device deployment.","model_type":"chat"},{"id":"liquid/lfm-2.5-1.2b-instruct:free","name":"LiquidAI: LFM2.5-1.2B-Instruct (free)","created_by":"liquid","source":"official","last_updated":"2026-06-18","description":"LFM2.5-1.2B-Instruct is a compact, high-performance instruction-tuned model built for fast on-device AI.","context_window":32768,"modalities":{"input":["text"],"output":["text"]},"parameters":1.2,"release_date":"2026-01-20","tagline":"LFM2.5-1.2B-Instruct is a compact, high-performance instruction-tuned model built for fast on-device AI.","model_type":"chat","capabilities":{"structured_output":true,"json_mode":true}},{"id":"liquid/lfm-2.5-1.2b-thinking:free","name":"LiquidAI: LFM2.5-1.2B-Thinking (free)","created_by":"liquid","source":"official","last_updated":"2026-06-18","description":"LFM2.5-1.2B-Thinking is a lightweight reasoning-focused model optimized for agentic tasks, data extraction, and RAG—while still running comfortably on edge 
devices.","context_window":32768,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"reasoning":true,"tool_call":true,"structured_output":true,"json_mode":true},"parameters":1.2,"release_date":"2026-01-20","tagline":"LFM2.5-1.2B-Thinking is a lightweight reasoning-focused model optimized for agentic tasks, data extraction, and RAG—while still running comfortably on edge devices.","model_type":"chat","tools":["function_calling"]},{"id":"liquid/lfm2-8b-a1b","name":"LiquidAI: LFM2-8B-A1B","created_by":"liquid","source":"official","last_updated":"2026-03-23","description":"LFM2-8B-A1B is an efficient on-device Mixture-of-Experts (MoE) model from Liquid AI’s LFM2 family, built for fast, high-quality inference on edge hardware.","context_window":32768,"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.01,"output":0.02},"parameters":8,"active_parameters":1,"release_date":"2025-10-20","tagline":"LFM2-8B-A1B is an efficient on-device Mixture-of-Experts (MoE) model from Liquid AI’s LFM2 family, built for fast, high-quality inference on edge hardware.","model_type":"chat"},{"id":"mancer/weaver","name":"Mancer: Weaver (alpha)","created_by":"mancer","source":"official","last_updated":"2026-03-24","description":"An attempt to recreate Claude-style verbosity, but don't expect the same level of coherence or memory.","context_window":8000,"max_output_tokens":2000,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"structured_output":true,"json_mode":true},"pricing":{"input":0.75,"output":1},"release_date":"2023-08-02","tagline":"An attempt to recreate Claude-style verbosity, but don't expect the same level of coherence or memory."},{"id":"meituan/longcat-flash-chat","name":"Meituan: LongCat Flash Chat","created_by":"meituan","source":"official","last_updated":"2026-03-24","description":"LongCat-Flash-Chat is a large-scale Mixture-of-Experts (MoE) model with 560B total parameters, of which 18.6B–31.3B (≈27B on average) are 
dynamically activated per input.","context_window":131072,"max_output_tokens":131072,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true},"pricing":{"input":0.2,"output":0.8,"cached_input":0.2},"release_date":"2025-09-09","tagline":"LongCat-Flash-Chat is a large-scale Mixture-of-Experts (MoE) model with 560B total parameters, of which 18.6B–31.3B (≈27B on average) are dynamically activated per input.","tools":["function_calling"]},{"id":"meta-llama/llama-3-70b-instruct","name":"Meta: Llama 3 70B Instruct","created_by":"meta-llama","source":"official","last_updated":"2026-06-10","family":"llama-3","description":"Meta's latest class of model (Llama 3) launched with a variety of sizes & flavors.","context_window":8192,"max_output_tokens":8000,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"structured_output":true,"json_mode":true},"pricing":{"input":0.51,"output":0.74},"model_type":"chat","parameters":70,"release_date":"2024-04-18","tagline":"Meta's latest class of model (Llama 3) launched with a variety of sizes & flavors.","status":"deprecated","deprecation_date":"2026-06-19"},{"id":"meta-llama/llama-3-8b-instruct","name":"Meta: Llama 3 8B Instruct","created_by":"meta-llama","source":"official","last_updated":"2026-06-10","family":"llama-3","description":"Meta's latest class of model (Llama 3) launched with a variety of sizes & flavors.","context_window":8192,"max_output_tokens":8192,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true},"pricing":{"input":0.14,"output":0.14},"model_type":"chat","parameters":8,"release_date":"2024-04-18","tagline":"Meta's latest class of model (Llama 3) launched with a variety of sizes & flavors.","tools":["function_calling"],"status":"deprecated","deprecation_date":"2026-05-07"},{"id":"meta-llama/llama-3.1-405b","name":"Meta: Llama 3.1 405B 
(base)","created_by":"meta-llama","source":"official","last_updated":"2026-03-23","family":"llama-3.1","description":"Meta's latest class of model (Llama 3.1) launched with a variety of sizes & flavors.","context_window":32768,"max_output_tokens":32768,"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":4,"output":4},"model_type":"chat","parameters":405,"release_date":"2024-08-02","tagline":"Meta's latest class of model (Llama 3.1) launched with a variety of sizes & flavors."},{"id":"meta-llama/llama-3.1-70b-instruct","name":"Meta: Llama 3.1 70B Instruct","created_by":"meta-llama","source":"official","last_updated":"2026-04-25","family":"llama-3.1","description":"Meta's latest class of model (Llama 3.1) launched with a variety of sizes & flavors.","context_window":131072,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true},"pricing":{"input":0.4,"output":0.4},"model_type":"chat","parameters":70,"release_date":"2024-07-23","tagline":"Meta's latest class of model (Llama 3.1) launched with a variety of sizes & flavors.","tools":["function_calling"],"max_output_tokens":16384},{"id":"meta-llama/llama-3.1-8b-instruct","name":"Meta: Llama 3.1 8B Instruct","created_by":"meta-llama","source":"official","last_updated":"2026-06-10","family":"llama-3.1","description":"Meta's latest class of model (Llama 3.1) launched with a variety of sizes & flavors.","context_window":131072,"max_output_tokens":16384,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true},"pricing":{"input":0.02,"output":0.03},"model_type":"chat","parameters":8,"release_date":"2024-07-23","tagline":"Meta's latest class of model (Llama 3.1) launched with a variety of sizes & flavors.","tools":["function_calling"]},{"id":"meta-llama/llama-3.2-11b-vision-instruct","name":"Meta: Llama 3.2 11B Vision 
Instruct","created_by":"meta-llama","source":"official","last_updated":"2026-06-10","family":"llama-3.2","description":"Llama 3.2 11B Vision is a multimodal model with 11 billion parameters, designed to handle tasks combining visual and textual data.","context_window":131072,"max_output_tokens":16384,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"structured_output":true,"json_mode":true},"pricing":{"input":0.345,"output":0.345},"model_type":"chat","parameters":11,"release_date":"2024-09-25","tagline":"Llama 3.2 11B Vision is a multimodal model with 11 billion parameters, designed to handle tasks combining visual and textual data."},{"id":"meta-llama/llama-3.2-1b-instruct","name":"Meta: Llama 3.2 1B Instruct","created_by":"meta-llama","source":"official","last_updated":"2026-05-23","family":"llama-3.2","description":"Llama 3.2 1B is a 1-billion-parameter language model focused on efficiently performing natural language tasks, such as summarization, dialogue, and multilingual text analysis.","context_window":131072,"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.027,"output":0.201},"model_type":"chat","parameters":1,"release_date":"2024-09-25","tagline":"Llama 3.2 1B is a 1-billion-parameter language model focused on efficiently performing natural language tasks, such as summarization, dialogue, and multilingual text analysis.","max_output_tokens":60000},{"id":"meta-llama/llama-3.2-3b-instruct:free","name":"Meta: Llama 3.2 3B Instruct (free)","created_by":"meta-llama","source":"official","last_updated":"2026-03-23","family":"llama-3.2","description":"Llama 3.2 3B is a 3-billion-parameter multilingual large language model, optimized for advanced natural language processing tasks like dialogue generation, reasoning, and summarization.","context_window":131072,"modalities":{"input":["text"],"output":["text"]},"model_type":"chat","parameters":3,"release_date":"2024-09-25","tagline":"Llama 3.2 3B is a 3-billion-parameter 
multilingual large language model, optimized for advanced natural language processing tasks like dialogue generation, reasoning, and summarization."},{"id":"meta-llama/llama-3.2-3b-instruct","name":"Meta: Llama 3.2 3B Instruct","created_by":"meta-llama","source":"official","last_updated":"2026-05-23","family":"llama-3.2","description":"Llama 3.2 3B is a 3-billion-parameter multilingual large language model, optimized for advanced natural language processing tasks like dialogue generation, reasoning, and summarization.","context_window":131072,"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.051,"output":0.335},"model_type":"chat","parameters":3,"release_date":"2024-09-25","tagline":"Llama 3.2 3B is a 3-billion-parameter multilingual large language model, optimized for advanced natural language processing tasks like dialogue generation, reasoning, and summarization.","max_output_tokens":80000},{"id":"meta-llama/llama-3.3-70b-instruct:free","name":"Meta: Llama 3.3 70B Instruct (free)","created_by":"meta-llama","source":"official","last_updated":"2026-05-17","family":"llama-3.3","description":"The Meta Llama 3.3 multilingual large language model (LLM) is a pretrained and instruction tuned generative model in 70B (text in/text out).","context_window":131072,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true},"model_type":"chat","parameters":70,"release_date":"2024-12-06","tagline":"The Meta Llama 3.3 multilingual large language model (LLM) is a pretrained and instruction tuned generative model in 70B (text in/text out).","tools":["function_calling"]},{"id":"meta-llama/llama-3.3-70b-instruct","name":"Meta: Llama 3.3 70B Instruct","created_by":"meta-llama","source":"official","last_updated":"2026-04-22","family":"llama-3.3","description":"The Meta Llama 3.3 multilingual large language model (LLM) is a pretrained and instruction tuned generative model in 70B (text in/text 
out).","context_window":131072,"max_output_tokens":16384,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true},"pricing":{"input":0.1,"output":0.32},"model_type":"chat","parameters":70,"release_date":"2024-12-06","tagline":"The Meta Llama 3.3 multilingual large language model (LLM) is a pretrained and instruction tuned generative model in 70B (text in/text out).","tools":["function_calling"]},{"id":"meta-llama/llama-4-maverick","name":"Meta: Llama 4 Maverick","created_by":"meta-llama","source":"official","last_updated":"2026-04-07","family":"llama-4","description":"Llama 4 Maverick 17B Instruct (128E) is a high-capacity multimodal language model from Meta, built on a mixture-of-experts (MoE) architecture with 128 experts and 17 billion active parameters per forw","context_window":1048576,"max_output_tokens":16384,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true},"pricing":{"input":0.15,"output":0.6},"model_type":"chat","release_date":"2025-04-05","tagline":"Llama 4 Maverick 17B Instruct (128E) is a high-capacity multimodal language model from Meta, built on a mixture-of-experts (MoE) architecture with 128 experts and 17 billion active parameters per forw","tools":["function_calling"]},{"id":"meta-llama/llama-4-scout","name":"Meta: Llama 4 Scout","created_by":"meta-llama","source":"official","last_updated":"2026-06-10","family":"llama-4","description":"Llama 4 Scout 17B Instruct (16E) is a mixture-of-experts (MoE) language model developed by Meta, activating 17 billion parameters out of a total of 109B.","context_window":10000000,"max_output_tokens":16384,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true},"pricing":{"input":0.1,"output":0.3},"model_type":"chat","release_date":"2025-04-05","tagline":"Llama 4 Scout 17B Instruct (16E) 
is a mixture-of-experts (MoE) language model developed by Meta, activating 17 billion parameters out of a total of 109B.","tools":["function_calling"]},{"id":"meta-llama/llama-guard-3-8b","name":"Llama Guard 3 8B","created_by":"meta-llama","source":"official","last_updated":"2026-05-23","family":"llama-guard","description":"Llama Guard 3 is a Llama-3.1-8B pretrained model, fine-tuned for content safety classification.","context_window":131072,"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.484,"output":0.03},"model_type":"moderation","parameters":8,"release_date":"2025-02-12","tagline":"Llama Guard 3 is a Llama-3.1-8B pretrained model, fine-tuned for content safety classification.","max_output_tokens":131072},{"id":"meta-llama/llama-guard-4-12b:free","name":"Meta: Llama Guard 4 12B (free)","created_by":"meta-llama","source":"official","family":"llama-guard","description":"Llama Guard 4 is a Llama 4 Scout-derived multimodal pretrained model, fine-tuned for content safety classification.","release_date":"2025-04-30","context_window":163840,"max_output_tokens":65000,"model_type":"chat","tagline":"Llama Guard 4 is a Llama 4 Scout-derived multimodal pretrained model, fine-tuned for content safety classification.","modalities":{"input":["image","text"],"output":["text"]},"last_updated":"2026-04-16"},{"id":"meta-llama/llama-guard-4-12b","name":"Meta: Llama Guard 4 12B","created_by":"meta-llama","source":"official","last_updated":"2026-04-25","family":"llama-guard","description":"Llama Guard 4 is a Llama 4 Scout-derived multimodal pretrained model, fine-tuned for content safety classification.","context_window":163840,"modalities":{"input":["image","text"],"output":["text"]},"capabilities":{"structured_output":true,"json_mode":true},"pricing":{"input":0.18,"output":0.18},"model_type":"moderation","parameters":12,"release_date":"2025-04-30","tagline":"Llama Guard 4 is a Llama 4 Scout-derived multimodal pretrained model, fine-tuned for content safety 
classification.","max_output_tokens":16384},{"id":"microsoft/phi-4-mini-instruct","name":"Microsoft: Phi 4 Mini Instruct","created_by":"microsoft","source":"official","description":"Phi-4-mini-instruct is a lightweight open model built upon synthetic data and filtered publicly available websites - with a focus on high-quality, reasoning dense data.","release_date":"2025-10-17","context_window":131072,"max_output_tokens":128000,"model_type":"chat","tagline":"Phi-4-mini-instruct is a lightweight open model built upon synthetic data and filtered publicly available websites - with a focus on high-quality, reasoning dense data.","capabilities":{"structured_output":true,"json_mode":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.08,"output":0.35,"cached_input":0.08},"last_updated":"2026-05-17"},{"id":"microsoft/phi-4","name":"Microsoft: Phi 4","created_by":"microsoft","source":"official","last_updated":"2026-06-29","description":"[Microsoft Research](/microsoft) Phi-4 is designed to perform well in complex reasoning tasks and can operate efficiently in situations with limited memory or where quick responses are needed.","context_window":16384,"max_output_tokens":16384,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"structured_output":true,"json_mode":true},"pricing":{"input":0.07,"output":0.14},"release_date":"2025-01-10","tagline":"[Microsoft Research](/microsoft) Phi-4 is designed to perform well in complex reasoning tasks and can operate efficiently in situations with limited memory or where quick responses are needed.","model_type":"chat"},{"id":"microsoft/wizardlm-2-8x22b","name":"WizardLM-2 8x22B","created_by":"microsoft","source":"official","last_updated":"2026-05-17","description":"WizardLM-2 8x22B is Microsoft AI's most advanced Wizard 
model.","context_window":65536,"max_output_tokens":8000,"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.62,"output":0.62},"release_date":"2024-04-16","tagline":"WizardLM-2 8x22B is Microsoft AI's most advanced Wizard model.","capabilities":{"structured_output":true,"json_mode":true}},{"id":"minimax/minimax-01","name":"MiniMax: MiniMax-01","created_by":"minimax","source":"official","last_updated":"2026-03-23","description":"MiniMax-01 is a combines MiniMax-Text-01 for text generation and MiniMax-VL-01 for image understanding.","context_window":1000192,"max_output_tokens":1000192,"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":0.2,"output":1.1},"model_type":"chat","family":"minimax","release_date":"2025-01-15","tagline":"MiniMax-01 is a combines MiniMax-Text-01 for text generation and MiniMax-VL-01 for image understanding."},{"id":"minimax/minimax-m1","name":"MiniMax: MiniMax M1","created_by":"minimax","source":"official","last_updated":"2026-03-23","description":"MiniMax-M1 is a large-scale, open-weight reasoning model designed for extended context and high-efficiency inference.","context_window":1000000,"max_output_tokens":40000,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"reasoning":true},"pricing":{"input":0.4,"output":2.2},"model_type":"chat","family":"minimax","release_date":"2025-06-17","tagline":"MiniMax-M1 is a large-scale, open-weight reasoning model designed for extended context and high-efficiency inference.","tools":["function_calling"]},{"id":"minimax/minimax-m2-her","name":"MiniMax: MiniMax M2-her","created_by":"minimax","source":"official","last_updated":"2026-03-23","description":"MiniMax M2-her is a dialogue-first large language model built for immersive roleplay, character-driven chat, and expressive multi-turn 
conversations.","context_window":65536,"max_output_tokens":2048,"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.3,"output":1.2,"cached_input":0.03},"model_type":"chat","family":"minimax","release_date":"2026-01-23","tagline":"MiniMax M2-her is a dialogue-first large language model built for immersive roleplay, character-driven chat, and expressive multi-turn conversations."},{"id":"minimax/minimax-m2.1","name":"MiniMax: MiniMax M2.1","created_by":"minimax","source":"official","last_updated":"2026-05-17","description":"MiniMax-M2.1 is a lightweight, state-of-the-art large language model optimized for coding, agentic workflows, and modern application development.","context_window":204800,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"fine_tuning":true},"pricing":{"input":0.29,"output":0.95,"cached_input":0.03},"family":"minimax","model_type":"chat","release_date":"2025-12-23","tagline":"MiniMax-M2.1 is a lightweight, state-of-the-art large language model optimized for coding, agentic workflows, and modern application development.","tools":["function_calling"],"max_output_tokens":196608,"license":"mit","open_weight":true},{"id":"minimax/minimax-m2.5:free","name":"MiniMax: MiniMax M2.5 (free)","created_by":"minimax","source":"official","last_updated":"2026-05-17","description":"MiniMax-M2.5 is a SOTA large language model designed for real-world productivity.","context_window":204800,"max_output_tokens":8192,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"family":"minimax","model_type":"chat","release_date":"2026-02-12","tagline":"MiniMax-M2.5 is a SOTA large language model designed for real-world productivity.","tools":["function_calling"]},{"id":"minimax/minimax-m2.5","name":"MiniMax: MiniMax 
M2.5","created_by":"minimax","source":"official","last_updated":"2026-06-29","description":"MiniMax-M2.5 is a SOTA large language model designed for real-world productivity.","context_window":204800,"max_output_tokens":196608,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"fine_tuning":true},"pricing":{"input":0.12,"output":0.48,"cached_input":0.05},"family":"minimax","model_type":"chat","release_date":"2026-02-12","tagline":"MiniMax-M2.5 is a SOTA large language model designed for real-world productivity.","tools":["function_calling"],"license":"mit","open_weight":true},{"id":"minimax/minimax-m2.7","name":"MiniMax: MiniMax M2.7","created_by":"minimax","source":"official","last_updated":"2026-06-29","description":"MiniMax-M2.7 is a next-generation large language model designed for autonomous, real-world productivity and continuous improvement.","context_window":204800,"max_output_tokens":196608,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true},"pricing":{"input":0.18,"output":0.72,"cached_input":0.05},"family":"minimax","model_type":"chat","release_date":"2026-03-18","tagline":"MiniMax-M2.7 is a next-generation large language model designed for autonomous, real-world productivity and continuous improvement.","tools":["function_calling"],"license":"proprietary","open_weight":false},{"id":"minimax/minimax-m2","name":"MiniMax: MiniMax M2","created_by":"minimax","source":"official","last_updated":"2026-05-17","description":"MiniMax-M2 is a compact, high-efficiency large language model optimized for end-to-end coding and agentic 
workflows.","context_window":204800,"max_output_tokens":196608,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true},"pricing":{"input":0.255,"output":1,"cached_input":0.03},"model_type":"chat","family":"minimax","release_date":"2025-10-23","tagline":"MiniMax-M2 is a compact, high-efficiency large language model optimized for end-to-end coding and agentic workflows.","tools":["function_calling"],"license":"proprietary","open_weight":false},{"id":"minimax/minimax-m3","name":"MiniMax: MiniMax M3","created_by":"minimax","source":"official","family":"minimax","description":"MiniMax-M3 is a multimodal foundation model from MiniMax.","release_date":"2026-05-31","context_window":1048576,"max_output_tokens":512000,"model_type":"chat","tagline":"MiniMax-M3 is a multimodal foundation model from MiniMax.","capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true},"modalities":{"input":["text","image","video"],"output":["text"]},"pricing":{"input":0.3,"output":1.2,"cached_input":0.06},"tools":["function_calling"],"last_updated":"2026-06-02","license":"proprietary","open_weight":false},{"id":"mistralai/codestral-2508","name":"Mistral: Codestral 2508","created_by":"mistral","source":"official","last_updated":"2026-03-24","family":"codestral","description":"Mistral's cutting-edge language model for coding released end of July 2025.","context_window":256000,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"vision":true,"fine_tuning":true},"pricing":{"input":0.3,"output":0.9,"cached_input":0.03},"model_type":"code","release_date":"2025-08-01","alias":"mistralai/codestral","tagline":"Mistral's cutting-edge language model for coding released end of July 
2025.","tools":["function_calling"],"license":"mnpl","open_weight":true},{"id":"mistralai/codestral","name":"Mistral: Codestral 2508","created_by":"mistral","source":"official","last_updated":"2026-03-24","family":"codestral","description":"Mistral's cutting-edge language model for coding released end of July 2025.","release_date":"2025-08-01","context_window":256000,"model_type":"code","tagline":"Mistral's cutting-edge language model for coding released end of July 2025.","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"vision":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.3,"output":0.9,"cached_input":0.03},"tools":["function_calling"],"snapshots":["mistralai/codestral-2508"],"license":"mnpl","open_weight":true},{"id":"mistralai/devstral-2512","name":"Mistral: Devstral 2 2512","created_by":"mistral","source":"official","last_updated":"2026-03-24","family":"devstral","description":"Devstral 2 is a state-of-the-art open-source model by Mistral AI specializing in agentic coding.","context_window":262144,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true},"pricing":{"input":0.4,"output":2,"cached_input":0.04},"model_type":"code","release_date":"2025-12-09","alias":"mistralai/devstral","tagline":"Devstral 2 is a state-of-the-art open-source model by Mistral AI specializing in agentic coding.","tools":["function_calling"]},{"id":"mistralai/devstral-medium","name":"Mistral: Devstral Medium","created_by":"mistral","source":"official","last_updated":"2026-03-24","family":"devstral","description":"Devstral Medium is a high-performance code generation and agentic reasoning model developed jointly by Mistral AI and All Hands 
AI.","context_window":131072,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"vision":true},"pricing":{"input":0.4,"output":2,"cached_input":0.04},"model_type":"chat","release_date":"2025-07-10","tagline":"Devstral Medium is a high-performance code generation and agentic reasoning model developed jointly by Mistral AI and All Hands AI.","tools":["function_calling"],"license":"proprietary","open_weight":false},{"id":"mistralai/devstral-small","name":"Mistral: Devstral Small 1.1","created_by":"mistral","source":"official","last_updated":"2026-03-24","family":"devstral","description":"Devstral Small 1.1 is a 24B parameter open-weight language model for software engineering agents, developed by Mistral AI in collaboration with All Hands AI.","context_window":131072,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"vision":true,"fine_tuning":true},"pricing":{"input":0.1,"output":0.3,"cached_input":0.01},"model_type":"chat","release_date":"2025-07-10","tagline":"Devstral Small 1.1 is a 24B parameter open-weight language model for software engineering agents, developed by Mistral AI in collaboration with All Hands AI.","tools":["function_calling"],"license":"apache-2.0","open_weight":true},{"id":"mistralai/devstral","name":"Mistral: Devstral 2 2512","created_by":"mistral","source":"official","last_updated":"2026-03-24","family":"devstral","description":"Devstral 2 is a state-of-the-art open-source model by Mistral AI specializing in agentic coding.","release_date":"2025-12-09","context_window":262144,"model_type":"code","tagline":"Devstral 2 is a state-of-the-art open-source model by Mistral AI specializing in agentic 
coding.","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.4,"output":2,"cached_input":0.04},"tools":["function_calling"],"snapshots":["mistralai/devstral-2512"]},{"id":"mistralai/ministral-14b-2512","name":"Mistral: Ministral 3 14B 2512","created_by":"mistral","source":"official","last_updated":"2026-03-24","family":"ministral","description":"The largest model in the Ministral 3 family, Ministral 3 14B offers frontier capabilities and performance comparable to its larger Mistral Small 3.2 24B counterpart.","context_window":262144,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"vision":true,"fine_tuning":true},"pricing":{"input":0.2,"output":0.2,"cached_input":0.02},"model_type":"chat","parameters":14,"release_date":"2025-12-02","alias":"mistralai/ministral-14b","tagline":"The largest model in the Ministral 3 family, Ministral 3 14B offers frontier capabilities and performance comparable to its larger Mistral Small 3.2 24B counterpart.","tools":["function_calling"],"license":"apache-2.0","open_weight":true},{"id":"mistralai/ministral-14b","name":"Mistral: Ministral 3 14B 2512","created_by":"mistral","source":"official","last_updated":"2026-03-24","family":"ministral","description":"The largest model in the Ministral 3 family, Ministral 3 14B offers frontier capabilities and performance comparable to its larger Mistral Small 3.2 24B counterpart.","release_date":"2025-12-02","context_window":262144,"parameters":14,"model_type":"chat","tagline":"The largest model in the Ministral 3 family, Ministral 3 14B offers frontier capabilities and performance comparable to its larger Mistral Small 3.2 24B 
counterpart.","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"vision":true,"fine_tuning":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":0.2,"output":0.2,"cached_input":0.02},"tools":["function_calling"],"snapshots":["mistralai/ministral-14b-2512"],"license":"apache-2.0","open_weight":true},{"id":"mistralai/ministral-3b-2512","name":"Mistral: Ministral 3 3B 2512","created_by":"mistral","source":"official","last_updated":"2026-03-24","family":"ministral","description":"The smallest model in the Ministral 3 family, Ministral 3 3B is a powerful, efficient tiny language model with vision capabilities.","context_window":131072,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"vision":true,"fine_tuning":true},"pricing":{"input":0.1,"output":0.1,"cached_input":0.01},"model_type":"chat","parameters":3,"release_date":"2025-12-02","alias":"mistralai/ministral-3b","tagline":"The smallest model in the Ministral 3 family, Ministral 3 3B is a powerful, efficient tiny language model with vision capabilities.","tools":["function_calling"],"license":"apache-2.0","open_weight":true},{"id":"mistralai/ministral-3b","name":"Mistral: Ministral 3 3B 2512","created_by":"mistral","source":"official","last_updated":"2026-03-24","family":"ministral","description":"The smallest model in the Ministral 3 family, Ministral 3 3B is a powerful, efficient tiny language model with vision capabilities.","release_date":"2025-12-02","context_window":131072,"parameters":3,"model_type":"chat","tagline":"The smallest model in the Ministral 3 family, Ministral 3 3B is a powerful, efficient tiny language model with vision 
capabilities.","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"vision":true,"fine_tuning":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":0.1,"output":0.1,"cached_input":0.01},"tools":["function_calling"],"snapshots":["mistralai/ministral-3b-2512"],"license":"apache-2.0","open_weight":true},{"id":"mistralai/ministral-8b-2512","name":"Mistral: Ministral 3 8B 2512","created_by":"mistral","source":"official","last_updated":"2026-03-24","family":"ministral","description":"A balanced model in the Ministral 3 family, Ministral 3 8B is a powerful, efficient tiny language model with vision capabilities.","context_window":262144,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"vision":true,"fine_tuning":true},"pricing":{"input":0.15,"output":0.15,"cached_input":0.015},"model_type":"chat","parameters":8,"release_date":"2025-12-02","alias":"mistralai/ministral-8b","tagline":"A balanced model in the Ministral 3 family, Ministral 3 8B is a powerful, efficient tiny language model with vision capabilities.","tools":["function_calling"],"license":"apache-2.0","open_weight":true},{"id":"mistralai/ministral-8b","name":"Mistral: Ministral 3 8B 2512","created_by":"mistral","source":"official","last_updated":"2026-03-24","family":"ministral","description":"A balanced model in the Ministral 3 family, Ministral 3 8B is a powerful, efficient tiny language model with vision capabilities.","release_date":"2025-12-02","context_window":262144,"parameters":8,"model_type":"chat","tagline":"A balanced model in the Ministral 3 family, Ministral 3 8B is a powerful, efficient tiny language model with vision 
capabilities.","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"vision":true,"fine_tuning":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":0.15,"output":0.15,"cached_input":0.015},"tools":["function_calling"],"snapshots":["mistralai/ministral-8b-2512"],"license":"apache-2.0","open_weight":true},{"id":"mistralai/mistral-7b-instruct-v0.1","name":"Mistral: Mistral 7B Instruct v0.1","created_by":"mistral","source":"official","last_updated":"2026-05-23","description":"A 7.3B parameter model that outperforms Llama 2 13B on all benchmarks, with optimizations for speed and context length.","context_window":4096,"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.11,"output":0.19},"model_type":"chat","family":"mistral-7b","parameters":7,"release_date":"2023-09-28","tagline":"A 7.3B parameter model that outperforms Llama 2 13B on all benchmarks, with optimizations for speed and context length.","status":"deprecated","deprecation_date":"2026-05-30","max_output_tokens":2824},{"id":"mistralai/mistral-large-2407","name":"Mistral Large 2407","created_by":"mistral","source":"official","last_updated":"2026-03-24","family":"mistral-large","description":"This is Mistral AI's flagship model, Mistral Large 2 (version mistral-large-2407).","context_window":131072,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"fine_tuning":true},"pricing":{"input":2,"output":6,"cached_input":0.2},"model_type":"chat","release_date":"2024-11-19","alias":"mistralai/mistral-large","tagline":"This is Mistral AI's flagship model, Mistral Large 2 (version mistral-large-2407).","tools":["function_calling"],"license":"apache-2.0","open_weight":true},{"id":"mistralai/mistral-large-2411","name":"Mistral Large 
2411","created_by":"mistral","source":"official","last_updated":"2026-04-07","family":"mistral-large","description":"Mistral Large 2 2411 is an update of [Mistral Large 2](/mistralai/mistral-large) released together with [Pixtral Large 2411](/mistralai/pixtral-large-2411) It provides a significant upgrade on the pre","context_window":131072,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"vision":true,"fine_tuning":true},"pricing":{"input":2,"output":6,"cached_input":0.2},"model_type":"chat","release_date":"2024-11-19","alias":"mistralai/mistral-large","tagline":"Mistral Large 2 2411 is an update of [Mistral Large 2](/mistralai/mistral-large) released together with [Pixtral Large 2411](/mistralai/pixtral-large-2411)\n\nIt provides a significant upgrade on the pr","tools":["function_calling"],"license":"apache-2.0","open_weight":true},{"id":"mistralai/mistral-large-2512","name":"Mistral: Mistral Large 3 2512","created_by":"mistral","source":"official","last_updated":"2026-03-24","family":"mistral-large","description":"Mistral Large 3 2512 is Mistral’s most capable model to date, featuring a sparse mixture-of-experts architecture with 41B active parameters (675B total), and released under the Apache 2.0 license.","context_window":262144,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"vision":true,"fine_tuning":true},"pricing":{"input":0.5,"output":1.5,"cached_input":0.05},"model_type":"chat","release_date":"2025-12-01","alias":"mistralai/mistral-large","tagline":"Mistral Large 3 2512 is Mistral’s most capable model to date, featuring a sparse mixture-of-experts architecture with 41B active parameters (675B total), and released under the Apache 2.0 
license.","tools":["function_calling"],"license":"apache-2.0","open_weight":true},{"id":"mistralai/mistral-large","name":"Mistral Large","created_by":"mistral","source":"official","last_updated":"2026-03-26","family":"mistral-large","description":"This is Mistral AI's flagship model, Mistral Large 2 (version `mistral-large-2407`).","context_window":128000,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"vision":true,"fine_tuning":true},"pricing":{"input":2,"output":6,"cached_input":0.2},"model_type":"chat","release_date":"2024-02-26","tagline":"Mistral Large 3 2512 is Mistral’s most capable model to date, featuring a sparse mixture-of-experts architecture with 41B active parameters (675B total), and released under the Apache 2.0 license.","tools":["function_calling"],"snapshots":["mistralai/mistral-large-2512","mistralai/mistral-large-2411","mistralai/mistral-large-2407"],"license":"apache-2.0","open_weight":true},{"id":"mistralai/mistral-medium-3-5","name":"Mistral: Mistral Medium 3.5","created_by":"mistral","source":"official","family":"mistral-medium","description":"Mistral Medium 3.5 is a dense 128B instruction-following model from Mistral AI.","release_date":"2026-04-30","context_window":262144,"model_type":"chat","tagline":"Mistral Medium 3.5 is a dense 128B instruction-following model from Mistral AI.","capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"vision":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":1.5,"output":7.5},"tools":["function_calling"],"last_updated":"2026-05-06","license":"proprietary","open_weight":false},{"id":"mistralai/mistral-medium-3.1","name":"Mistral: Mistral Medium 3.1","created_by":"mistral","source":"official","last_updated":"2026-03-24","family":"mistral-medium","description":"Mistral Medium 3.1 is an updated version of Mistral Medium 3, which 
is a high-performance enterprise-grade language model designed to deliver frontier-level capabilities at significantly reduced operational cost.","context_window":131072,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true},"pricing":{"input":0.4,"output":2,"cached_input":0.04},"model_type":"chat","release_date":"2025-08-13","tagline":"Mistral Medium 3.1 is an updated version of Mistral Medium 3, which is a high-performance enterprise-grade language model designed to deliver frontier-level capabilities at significantly reduced opera","tools":["function_calling"]},{"id":"mistralai/mistral-medium-3","name":"Mistral: Mistral Medium 3","created_by":"mistral","source":"official","last_updated":"2026-03-24","family":"mistral-medium","description":"Mistral Medium 3 is a high-performance enterprise-grade language model designed to deliver frontier-level capabilities at significantly reduced operational cost.","context_window":131072,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true},"pricing":{"input":0.4,"output":2,"cached_input":0.04},"model_type":"chat","release_date":"2025-05-07","tagline":"Mistral Medium 3 is a high-performance enterprise-grade language model designed to deliver frontier-level capabilities at significantly reduced operational cost.","tools":["function_calling"]},{"id":"mistralai/mistral-nemo","name":"Mistral: Mistral Nemo","created_by":"mistral","source":"official","last_updated":"2026-05-23","description":"A 12B parameter model with a 128k token context length built by Mistral in collaboration with 
NVIDIA.","context_window":131072,"max_output_tokens":16384,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"vision":true,"fine_tuning":true},"pricing":{"input":0.02,"output":0.03},"model_type":"chat","family":"mistral-nemo","release_date":"2024-07-19","tagline":"A 12B parameter model with a 128k token context length built by Mistral in collaboration with NVIDIA.","tools":["function_calling"],"license":"apache-2.0","open_weight":true},{"id":"mistralai/mistral-saba","name":"Mistral: Saba","created_by":"mistral","source":"official","last_updated":"2026-03-24","description":"Mistral Saba is a 24B-parameter language model specifically designed for the Middle East and South Asia, delivering accurate and contextually relevant responses while maintaining efficient performance.","context_window":32768,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"fine_tuning":true},"pricing":{"input":0.2,"output":0.6,"cached_input":0.02},"model_type":"chat","family":"mistral-saba","release_date":"2025-02-17","tagline":"Mistral Saba is a 24B-parameter language model specifically designed for the Middle East and South Asia, delivering accurate and contextually relevant responses while maintaining efficient performance","tools":["function_calling"],"license":"apache-2.0","open_weight":true},{"id":"mistralai/mistral-small-24b-instruct-2501","name":"Mistral: Mistral Small 3","created_by":"mistral","source":"official","last_updated":"2026-03-24","family":"mistral-small","description":"Mistral Small 3 is a 24B-parameter language model optimized for low-latency performance across common AI 
tasks.","context_window":32768,"max_output_tokens":16384,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true},"pricing":{"input":0.05,"output":0.08},"model_type":"chat","parameters":24,"release_date":"2025-01-30","alias":"mistralai/mistral-small-24b-instruct","tagline":"Mistral Small 3 is a 24B-parameter language model optimized for low-latency performance across common AI tasks.","tools":["function_calling"]},{"id":"mistralai/mistral-small-24b-instruct","name":"Mistral: Mistral Small 3","created_by":"mistral","source":"official","last_updated":"2026-03-24","family":"mistral-small","description":"Mistral Small 3 is a 24B-parameter language model optimized for low-latency performance across common AI tasks.","release_date":"2025-01-30","context_window":32768,"max_output_tokens":16384,"parameters":24,"model_type":"chat","tagline":"Mistral Small 3 is a 24B-parameter language model optimized for low-latency performance across common AI tasks.","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.05,"output":0.08},"tools":["function_calling"],"snapshots":["mistralai/mistral-small-24b-instruct-2501"]},{"id":"mistralai/mistral-small-2603","name":"Mistral: Mistral Small 4","created_by":"mistral","source":"official","last_updated":"2026-03-24","family":"mistral-small","description":"Mistral Small 4 is the next major release in the Mistral Small family, unifying the capabilities of several flagship Mistral models into a single 
system.","context_window":262144,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"vision":true,"fine_tuning":true},"pricing":{"input":0.15,"output":0.6,"cached_input":0.015},"model_type":"chat","release_date":"2026-03-16","alias":"mistralai/mistral-small","tagline":"Mistral Small 4 is the next major release in the Mistral Small family, unifying the capabilities of several flagship Mistral models into a single system.","tools":["function_calling"],"license":"apache-2.0","open_weight":true},{"id":"mistralai/mistral-small-3.1-24b-instruct:free","name":"Mistral: Mistral Small 3.1 24B (free)","created_by":"mistral","source":"official","last_updated":"2026-03-24","family":"mistral-small","description":"Mistral Small 3.1 24B Instruct is an upgraded variant of Mistral Small 3 (2501), featuring 24 billion parameters with advanced multimodal capabilities.","status":"deprecated","deprecation_date":"2026-03-29","context_window":128000,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true},"model_type":"chat","parameters":24,"release_date":"2025-03-17","tagline":"Mistral Small 3.1 24B Instruct is an upgraded variant of Mistral Small 3 (2501), featuring 24 billion parameters with advanced multimodal capabilities.","tools":["function_calling"]},{"id":"mistralai/mistral-small-3.1-24b-instruct","name":"Mistral: Mistral Small 3.1 24B","created_by":"mistral","source":"official","last_updated":"2026-05-23","family":"mistral-small","description":"Mistral Small 3.1 24B Instruct is an upgraded variant of Mistral Small 3 (2501), featuring 24 billion parameters with advanced multimodal 
capabilities.","context_window":128000,"max_output_tokens":128000,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"structured_output":true,"json_mode":true},"pricing":{"input":0.351,"output":0.555,"cached_input":0.015},"model_type":"chat","parameters":24,"release_date":"2025-03-17","tagline":"Mistral Small 3.1 24B Instruct is an upgraded variant of Mistral Small 3 (2501), featuring 24 billion parameters with advanced multimodal capabilities."},{"id":"mistralai/mistral-small-3.2-24b-instruct","name":"Mistral: Mistral Small 3.2 24B","created_by":"mistral","source":"official","last_updated":"2026-04-25","family":"mistral-small","description":"Mistral-Small-3.2-24B-Instruct-2506 is an updated 24B parameter model from Mistral optimized for instruction following, repetition reduction, and improved function calling.","context_window":128000,"modalities":{"input":["image","text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true},"pricing":{"input":0.075,"output":0.2},"model_type":"chat","parameters":24,"release_date":"2025-06-20","tagline":"Mistral-Small-3.2-24B-Instruct-2506 is an updated 24B parameter model from Mistral optimized for instruction following, repetition reduction, and improved function calling.","tools":["function_calling"],"max_output_tokens":16384},{"id":"mistralai/mistral-small-creative","name":"Mistral: Mistral Small Creative","created_by":"mistral","source":"official","last_updated":"2026-03-23","family":"mistral-small","description":"Mistral Small Creative is an experimental small model designed for creative writing, narrative generation, roleplay and character-driven dialogue, general-purpose instruction following, and 
conversati","status":"deprecated","deprecation_date":"2026-04-30","context_window":32768,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"streaming":true,"vision":true,"fine_tuning":true},"pricing":{"input":0.1,"output":0.3,"cached_input":0.01},"model_type":"chat","release_date":"2025-12-16","tagline":"Mistral Small Creative is an experimental small model designed for creative writing, narrative generation, roleplay and character-driven dialogue, general-purpose instruction following, and conversati","tools":["function_calling"],"license":"apache-2.0","open_weight":true},{"id":"mistralai/mistral-small","name":"Mistral: Mistral Small 4","created_by":"mistral","source":"official","last_updated":"2026-03-24","family":"mistral-small","description":"Mistral Small 4 is the next major release in the Mistral Small family, unifying the capabilities of several flagship Mistral models into a single system.","release_date":"2026-03-16","context_window":262144,"model_type":"chat","tagline":"Mistral Small 4 is the next major release in the Mistral Small family, unifying the capabilities of several flagship Mistral models into a single system.","capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"vision":true,"fine_tuning":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":0.15,"output":0.6,"cached_input":0.015},"tools":["function_calling"],"snapshots":["mistralai/mistral-small-2603"],"license":"apache-2.0","open_weight":true},{"id":"mistralai/mixtral-8x22b-instruct","name":"Mistral: Mixtral 8x22B Instruct","created_by":"mistral","source":"official","last_updated":"2026-03-24","family":"mixtral","description":"Mistral's official instruct fine-tuned version of [Mixtral 
8x22B](/models/mistralai/mixtral-8x22b).","context_window":65536,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true},"pricing":{"input":2,"output":6,"cached_input":0.2},"model_type":"chat","release_date":"2024-04-17","tagline":"Mistral's official instruct fine-tuned version of [Mixtral 8x22B](/models/mistralai/mixtral-8x22b).","tools":["function_calling"]},{"id":"mistralai/mixtral-8x7b-instruct","name":"Mistral: Mixtral 8x7B Instruct","created_by":"mistral","source":"official","last_updated":"2026-05-07","family":"mixtral","description":"Mixtral 8x7B Instruct is a pretrained generative Sparse Mixture of Experts, by Mistral AI, for chat and instruction use.","context_window":32768,"max_output_tokens":16384,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true},"pricing":{"input":0.54,"output":0.54},"model_type":"chat","release_date":"2023-12-10","tagline":"Mixtral 8x7B Instruct is a pretrained generative Sparse Mixture of Experts, by Mistral AI, for chat and instruction use.","tools":["function_calling"],"status":"deprecated","deprecation_date":"2026-05-07"},{"id":"mistralai/pixtral-12b","name":"Mistral: Pixtral 12B","created_by":"mistral","source":"official","last_updated":"2026-03-23","family":"pixtral","description":"The first multi-modal, text+image-to-text model from Mistral AI.","context_window":32768,"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":0.1,"output":0.1},"model_type":"chat","parameters":12,"release_date":"2024-09-10","tagline":"The first multi-modal, text+image-to-text model from Mistral AI.","license":"apache-2.0","open_weight":true,"capabilities":{"streaming":true,"vision":true,"tool_call":true,"fine_tuning":true}},{"id":"mistralai/pixtral-large-2411","name":"Mistral: Pixtral Large 
2411","created_by":"mistral","source":"official","last_updated":"2026-03-24","family":"pixtral","description":"Pixtral Large is a 124B parameter, open-weight, multimodal model built on top of [Mistral Large 2](/mistralai/mistral-large-2411).","context_window":131072,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"vision":true,"fine_tuning":true},"pricing":{"input":2,"output":6,"cached_input":0.2},"model_type":"chat","release_date":"2024-11-19","alias":"mistralai/pixtral-large","tagline":"Pixtral Large is a 124B parameter, open-weight, multimodal model built on top of [Mistral Large 2](/mistralai/mistral-large-2411).","tools":["function_calling"],"license":"mnpl","open_weight":true},{"id":"mistralai/pixtral-large","name":"Mistral: Pixtral Large 2411","created_by":"mistral","source":"official","last_updated":"2026-03-24","family":"pixtral","description":"Pixtral Large is a 124B parameter, open-weight, multimodal model built on top of [Mistral Large 2](/mistralai/mistral-large-2411).","release_date":"2024-11-19","context_window":131072,"model_type":"chat","tagline":"Pixtral Large is a 124B parameter, open-weight, multimodal model built on top of [Mistral Large 2](/mistralai/mistral-large-2411).","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"vision":true,"fine_tuning":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":2,"output":6,"cached_input":0.2},"tools":["function_calling"],"snapshots":["mistralai/pixtral-large-2411"],"license":"mnpl","open_weight":true},{"id":"mistralai/voxtral-small-24b-2507","name":"Mistral: Voxtral Small 24B 2507","created_by":"mistral","source":"official","last_updated":"2026-03-24","description":"Voxtral Small is an enhancement of Mistral Small 3, incorporating state-of-the-art audio input capabilities while retaining best-in-class text 
performance.","context_window":32000,"modalities":{"input":["text","audio"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true},"pricing":{"input":0.1,"output":0.3,"cached_input":0.01},"model_type":"audio","family":"voxtral","parameters":24,"release_date":"2025-10-30","alias":"mistralai/voxtral-small-24b","tagline":"Voxtral Small is an enhancement of Mistral Small 3, incorporating state-of-the-art audio input capabilities while retaining best-in-class text performance.","tools":["function_calling"]},{"id":"mistralai/voxtral-small-24b","name":"Mistral: Voxtral Small 24B 2507","created_by":"mistral","source":"official","last_updated":"2026-03-24","family":"voxtral","description":"Voxtral Small is an enhancement of Mistral Small 3, incorporating state-of-the-art audio input capabilities while retaining best-in-class text performance.","release_date":"2025-10-30","context_window":32000,"parameters":24,"model_type":"audio","tagline":"Voxtral Small is an enhancement of Mistral Small 3, incorporating state-of-the-art audio input capabilities while retaining best-in-class text performance.","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true},"modalities":{"input":["text","audio"],"output":["text"]},"pricing":{"input":0.1,"output":0.3,"cached_input":0.01},"tools":["function_calling"],"snapshots":["mistralai/voxtral-small-24b-2507"]},{"id":"moonshotai/kimi-k2-0905","name":"MoonshotAI: Kimi K2 0905","created_by":"moonshotai","source":"official","last_updated":"2026-06-29","description":"Kimi K2 0905 is the September update of [Kimi K2 0711](moonshotai/kimi-k2).","context_window":262144,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true},"pricing":{"input":0.6,"output":2.5,"cached_input":0.15},"family":"kimi-k2","model_type":"chat","release_date":"2025-09-04","tagline":"Kimi K2 0905 is the September update of [Kimi K2 
0711](moonshotai/kimi-k2).","tools":["function_calling"],"max_output_tokens":100352,"status":"deprecated","deprecation_date":"2026-05-14"},{"id":"moonshotai/kimi-k2-thinking","name":"MoonshotAI: Kimi K2 Thinking","created_by":"moonshotai","source":"official","last_updated":"2026-06-29","description":"Kimi K2 Thinking is Moonshot AI’s most advanced open reasoning model to date, extending the K2 series into agentic, long-horizon reasoning.","context_window":262144,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":0.6,"output":2.5,"cached_input":0.6},"family":"kimi-k2","model_type":"chat","release_date":"2025-11-06","tagline":"Kimi K2 Thinking is Moonshot AI’s most advanced open reasoning model to date, extending the K2 series into agentic, long-horizon reasoning.","tools":["function_calling"],"max_output_tokens":262144},{"id":"moonshotai/kimi-k2.5","name":"MoonshotAI: Kimi K2.5","created_by":"moonshotai","source":"official","last_updated":"2026-06-18","description":"Kimi K2.5 is Moonshot AI's native multimodal model, delivering state-of-the-art visual coding capability and a self-directed agent swarm paradigm.","context_window":262144,"max_output_tokens":262144,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":0.375,"output":2.025,"cached_input":0.09},"family":"kimi-k2.5","model_type":"chat","release_date":"2026-01-27","tagline":"Kimi K2.5 is Moonshot AI's native multimodal model, delivering state-of-the-art visual coding capability and a self-directed agent swarm paradigm.","tools":["function_calling"]},{"id":"moonshotai/kimi-k2.6:free","name":"MoonshotAI: Kimi K2.6 (free)","created_by":"moonshotai","source":"official","family":"kimi-k2.6","description":"Kimi K2.6 is Moonshot AI's next-generation multimodal model, designed for 
long-horizon coding, coding-driven UI/UX generation, and multi-agent orchestration.","release_date":"2026-04-20","context_window":262144,"model_type":"chat","tagline":"Kimi K2.6 is Moonshot AI's next-generation multimodal model, designed for long-horizon coding, coding-driven UI/UX generation, and multi-agent orchestration.","capabilities":{"tool_call":true,"reasoning":true},"modalities":{"input":["text","image"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-05-29"},{"id":"moonshotai/kimi-k2.6","name":"MoonshotAI: Kimi K2.6","created_by":"moonshotai","source":"official","family":"kimi-k2.6","description":"Kimi K2.6 is Moonshot AI's next-generation multimodal model, designed for long-horizon coding, coding-driven UI/UX generation, and multi-agent orchestration.","release_date":"2026-04-20","context_window":262144,"max_output_tokens":262144,"model_type":"chat","tagline":"Kimi K2.6 is Moonshot AI's next-generation multimodal model, designed for long-horizon coding, coding-driven UI/UX generation, and multi-agent orchestration.","capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":0.55,"output":3.2,"cached_input":0.11},"tools":["function_calling"],"last_updated":"2026-06-29"},{"id":"moonshotai/kimi-k2.7-code","name":"MoonshotAI: Kimi K2.7 Code","created_by":"moonshotai","source":"official","family":"kimi-k2.7","description":"MoonshotAI: Kimi K2.7 Code is a coding-focused model in Moonshot AI's Kimi K2 family, built to complete end-to-end programming tasks reliably over long contexts.","release_date":"2026-06-12","context_window":262144,"max_output_tokens":16384,"model_type":"chat","tagline":"MoonshotAI: Kimi K2.7 Code is a coding-focused model in Moonshot AI's Kimi K2 family, built to complete end-to-end programming tasks reliably over long 
contexts.","capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":0.74,"output":3.5,"cached_input":0.15},"tools":["function_calling"],"last_updated":"2026-06-29"},{"id":"moonshotai/kimi-k2","name":"MoonshotAI: Kimi K2 0711","created_by":"moonshotai","source":"official","last_updated":"2026-06-29","description":"Kimi K2 Instruct is a large-scale Mixture-of-Experts (MoE) language model developed by Moonshot AI, featuring 1 trillion total parameters with 32 billion active per forward pass.","context_window":131072,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true},"pricing":{"input":0.57,"output":2.3},"family":"kimi-k2","model_type":"chat","release_date":"2025-07-11","tagline":"Kimi K2 Instruct is a large-scale Mixture-of-Experts (MoE) language model developed by Moonshot AI, featuring 1 trillion total parameters with 32 billion active per forward pass.","tools":["function_calling"],"max_output_tokens":100352},{"id":"morph/morph-v3-fast","name":"Morph: Morph V3 Fast","created_by":"morph","source":"official","last_updated":"2026-03-23","description":"Morph's fastest apply model for code edits.","context_window":81920,"max_output_tokens":38000,"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.8,"output":1.2},"release_date":"2025-07-07","tagline":"Morph's fastest apply model for code edits."},{"id":"morph/morph-v3-large","name":"Morph: Morph V3 Large","created_by":"morph","source":"official","last_updated":"2026-06-20","description":"Morph's high-accuracy apply model for complex code edits.","context_window":262144,"max_output_tokens":131072,"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.9,"output":1.9},"release_date":"2025-07-07","tagline":"Morph's high-accuracy apply model for complex code 
edits.","capabilities":{"structured_output":true,"json_mode":true}},{"id":"nex-agi/deepseek-v3.1-nex-n1","name":"Nex AGI: DeepSeek V3.1 Nex N1","created_by":"nex-agi","source":"official","last_updated":"2026-06-03","family":"deepseek","description":"DeepSeek V3.1 Nex-N1 is the flagship release of the Nex-N1 series — a post-trained model designed to highlight agent autonomy, tool use, and real-world productivity.","context_window":131072,"max_output_tokens":163840,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true},"pricing":{"input":0.135,"output":0.5},"release_date":"2025-12-08","tagline":"DeepSeek V3.1 Nex-N1 is the flagship release of the Nex-N1 series — a post-trained model designed to highlight agent autonomy, tool use, and real-world productivity.","tools":["function_calling"],"model_type":"chat","status":"deprecated","deprecation_date":"2026-06-08"},{"id":"nex-agi/nex-n2-pro:free","name":"Nex AGI: Nex-N2-Pro (free)","created_by":"nex-agi","source":"official","description":"Nex-N2-Pro is an agentic mixture-of-experts model from Nex AGI, with 17B active parameters out of 397B total.","release_date":"2026-06-08","context_window":262144,"max_output_tokens":262144,"tagline":"Nex-N2-Pro is an agentic mixture-of-experts model from Nex AGI, with 17B active parameters out of 397B total.","capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"modalities":{"input":["text","image"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-06-20","status":"deprecated","deprecation_date":"2026-06-22"},{"id":"nex-agi/nex-n2-pro","name":"Nex AGI: Nex-N2-Pro","created_by":"nex-agi","source":"official","description":"Nex-N2-Pro is an agentic mixture-of-experts model from Nex AGI, with 17B active parameters out of 397B total.","release_date":"2026-06-08","context_window":262144,"max_output_tokens":262144,"tagline":"Nex-N2-Pro is an agentic 
mixture-of-experts model from Nex AGI, with 17B active parameters out of 397B total.","capabilities":{"reasoning":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":0.25,"output":1,"cached_input":0.025},"last_updated":"2026-06-29"},{"id":"nousresearch/hermes-2-pro-llama-3-8b","name":"NousResearch: Hermes 2 Pro - Llama-3 8B","created_by":"nousresearch","source":"official","last_updated":"2026-05-29","description":"Hermes 2 Pro is an upgraded, retrained version of Nous Hermes 2, consisting of an updated and cleaned version of the OpenHermes 2.5 Dataset, as well as a newly introduced...","context_window":8192,"max_output_tokens":8192,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"structured_output":true,"json_mode":true},"pricing":{"input":0.14,"output":0.14},"model_type":"chat","parameters":8,"release_date":"2024-05-27","tagline":"Hermes 2 Pro is an upgraded, retrained version of Nous Hermes 2, consisting of an updated and cleaned version of the OpenHermes 2.5 Dataset, as well as a newly introduced Function Calling and JSON Mod","status":"deprecated","deprecation_date":"2026-06-05"},{"id":"nousresearch/hermes-3-llama-3.1-405b:free","name":"Nous: Hermes 3 405B Instruct (free)","created_by":"nousresearch","source":"official","last_updated":"2026-04-07","description":"Hermes 3 is a generalist language model with many improvements over Hermes 2, including advanced agentic capabilities, much better roleplaying, reasoning, multi-turn conversation, long context coheren","context_window":131072,"modalities":{"input":["text"],"output":["text"]},"model_type":"chat","release_date":"2024-08-16","tagline":"Hermes 3 is a generalist language model with many improvements over Hermes 2, including advanced agentic capabilities, much better roleplaying, reasoning, multi-turn conversation, long context coheren"},{"id":"nousresearch/hermes-3-llama-3.1-405b","name":"Nous: Hermes 3 405B 
Instruct","created_by":"nousresearch","source":"official","last_updated":"2026-04-07","description":"Hermes 3 is a generalist language model with many improvements over Hermes 2, including advanced agentic capabilities, much better roleplaying, reasoning, multi-turn conversation, long context coheren","context_window":131072,"max_output_tokens":16384,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"structured_output":true,"json_mode":true},"pricing":{"input":1,"output":1},"model_type":"chat","parameters":405,"release_date":"2024-08-16","tagline":"Hermes 3 is a generalist language model with many improvements over Hermes 2, including advanced agentic capabilities, much better roleplaying, reasoning, multi-turn conversation, long context coheren"},{"id":"nousresearch/hermes-3-llama-3.1-70b","name":"Nous: Hermes 3 70B Instruct","created_by":"nousresearch","source":"official","last_updated":"2026-06-10","description":"Hermes 3 is a generalist language model with many improvements over [Hermes 2](/models/nousresearch/nous-hermes-2-mistral-7b-dpo), including advanced agentic capabilities, much better roleplaying, rea","context_window":131072,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"structured_output":true,"json_mode":true},"pricing":{"input":0.7,"output":0.7},"model_type":"chat","parameters":70,"release_date":"2024-08-18","tagline":"Hermes 3 is a generalist language model with many improvements over [Hermes 2](/models/nousresearch/nous-hermes-2-mistral-7b-dpo), including advanced agentic capabilities, much better roleplaying, rea","max_output_tokens":16384},{"id":"nousresearch/hermes-4-405b","name":"Nous: Hermes 4 405B","created_by":"nousresearch","source":"official","last_updated":"2026-03-24","description":"Hermes 4 is a large-scale reasoning model built on Meta-Llama-3.1-405B and released by Nous 
Research.","context_window":131072,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":1,"output":3},"model_type":"chat","parameters":405,"release_date":"2025-08-26","tagline":"Hermes 4 is a large-scale reasoning model built on Meta-Llama-3.1-405B and released by Nous Research."},{"id":"nousresearch/hermes-4-70b","name":"Nous: Hermes 4 70B","created_by":"nousresearch","source":"official","last_updated":"2026-03-24","description":"Hermes 4 70B is a hybrid reasoning model from Nous Research, built on Meta-Llama-3.1-70B.","context_window":131072,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":0.13,"output":0.4},"model_type":"chat","parameters":70,"release_date":"2025-08-26","tagline":"Hermes 4 70B is a hybrid reasoning model from Nous Research, built on Meta-Llama-3.1-70B."},{"id":"nvidia/llama-3.1-nemotron-70b-instruct","name":"NVIDIA: Llama 3.1 Nemotron 70B Instruct","created_by":"nvidia","source":"official","last_updated":"2026-05-07","family":"llama-3.1","description":"NVIDIA's Llama 3.1 Nemotron 70B is a language model designed for generating precise and useful responses.","context_window":131072,"max_output_tokens":16384,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true},"pricing":{"input":1.2,"output":1.2},"model_type":"chat","parameters":70,"release_date":"2024-10-15","tagline":"NVIDIA's Llama 3.1 Nemotron 70B is a language model designed for generating precise and useful responses.","tools":["function_calling"],"status":"deprecated","deprecation_date":"2026-05-07"},{"id":"nvidia/llama-3.1-nemotron-ultra-253b-v1","name":"NVIDIA: Llama 3.1 Nemotron Ultra 253B v1","created_by":"nvidia","source":"official","last_updated":"2026-03-24","family":"llama-3.1","description":"Llama-3.1-Nemotron-Ultra-253B-v1 
is a large language model (LLM) optimized for advanced reasoning, human-interactive chat, retrieval-augmented generation (RAG), and tool-calling tasks.","context_window":131072,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":0.6,"output":1.8},"model_type":"chat","parameters":253,"release_date":"2025-04-08","tagline":"Llama-3.1-Nemotron-Ultra-253B-v1 is a large language model (LLM) optimized for advanced reasoning, human-interactive chat, retrieval-augmented generation (RAG), and tool-calling tasks."},{"id":"nvidia/llama-3.3-nemotron-super-49b-v1.5","name":"NVIDIA: Llama 3.3 Nemotron Super 49B V1.5","created_by":"nvidia","source":"official","last_updated":"2026-06-10","family":"llama-3.3","description":"Llama-3.3-Nemotron-Super-49B-v1.5 is a 49B-parameter, English-centric reasoning/chat model derived from Meta’s Llama-3.3-70B-Instruct with a 128K context.","context_window":131072,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":0.4,"output":0.4},"model_type":"chat","parameters":49,"release_date":"2025-10-10","tagline":"Llama-3.3-Nemotron-Super-49B-v1.5 is a 49B-parameter, English-centric reasoning/chat model derived from Meta’s Llama-3.3-70B-Instruct with a 128K context.","tools":["function_calling"],"max_output_tokens":16384},{"id":"nvidia/nemotron-3-nano-30b-a3b:free","name":"NVIDIA: Nemotron 3 Nano 30B A3B (free)","created_by":"nvidia","source":"official","last_updated":"2026-03-23","description":"NVIDIA Nemotron 3 Nano 30B A3B is a small language MoE model with highest compute efficiency and accuracy for developers to build specialized agentic AI 
systems.","context_window":256000,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"reasoning":true},"model_type":"chat","parameters":30,"active_parameters":3,"release_date":"2025-12-14","tagline":"NVIDIA Nemotron 3 Nano 30B A3B is a small language MoE model with highest compute efficiency and accuracy for developers to build specialized agentic AI systems.","tools":["function_calling"]},{"id":"nvidia/nemotron-3-nano-30b-a3b","name":"NVIDIA: Nemotron 3 Nano 30B A3B","created_by":"nvidia","source":"official","last_updated":"2026-04-25","description":"NVIDIA Nemotron 3 Nano 30B A3B is a small language MoE model with highest compute efficiency and accuracy for developers to build specialized agentic AI systems.","context_window":262144,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":0.05,"output":0.2},"model_type":"chat","parameters":30,"active_parameters":3,"release_date":"2025-12-14","tagline":"NVIDIA Nemotron 3 Nano 30B A3B is a small language MoE model with highest compute efficiency and accuracy for developers to build specialized agentic AI systems.","tools":["function_calling"],"max_output_tokens":228000},{"id":"nvidia/nemotron-3-nano-omni-30b-a3b-reasoning:free","name":"NVIDIA: Nemotron 3 Nano Omni (free)","created_by":"nvidia","source":"official","description":"NVIDIA Nemotron™ 3 Nano Omni is a 30B-A3B open multimodal model designed to function as a perception and context sub-agent in enterprise agent systems.","release_date":"2026-04-28","context_window":256000,"max_output_tokens":65536,"parameters":30,"active_parameters":3,"model_type":"reasoning","tagline":"NVIDIA Nemotron™ 3 Nano Omni is a 30B-A3B open multimodal model designed to function as a perception and context sub-agent in enterprise agent 
systems.","capabilities":{"tool_call":true,"reasoning":true},"modalities":{"input":["text","audio","image","video"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-05-01"},{"id":"nvidia/nemotron-3-super-120b-a12b:free","name":"NVIDIA: Nemotron 3 Super (free)","created_by":"nvidia","source":"official","last_updated":"2026-05-17","description":"NVIDIA Nemotron 3 Super is a 120B-parameter open hybrid MoE model, activating just 12B parameters for maximum compute efficiency and accuracy in complex multi-agent applications.","context_window":1000000,"max_output_tokens":262144,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"model_type":"chat","parameters":120,"active_parameters":12,"release_date":"2026-03-11","tagline":"NVIDIA Nemotron 3 Super is a 120B-parameter open hybrid MoE model, activating just 12B parameters for maximum compute efficiency and accuracy in complex multi-agent applications.","tools":["function_calling"]},{"id":"nvidia/nemotron-3-super-120b-a12b","name":"NVIDIA: Nemotron 3 Super","created_by":"nvidia","source":"official","last_updated":"2026-06-29","description":"NVIDIA Nemotron 3 Super is a 120B-parameter open hybrid MoE model, activating just 12B parameters for maximum compute efficiency and accuracy in complex multi-agent applications.","context_window":1000000,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":0.085,"output":0.4,"cached_input":0.1},"model_type":"chat","parameters":120,"active_parameters":12,"release_date":"2026-03-11","tagline":"NVIDIA Nemotron 3 Super is a 120B-parameter open hybrid MoE model, activating just 12B parameters for maximum compute efficiency and accuracy in complex multi-agent 
applications.","tools":["function_calling"],"max_output_tokens":16384},{"id":"nvidia/nemotron-3-ultra-550b-a55b:free","name":"NVIDIA: Nemotron 3 Ultra (free)","created_by":"nvidia","source":"official","description":"NVIDIA Nemotron 3 Ultra is an open frontier-reasoning and orchestration model from NVIDIA, with 55B active parameters out of 550B total (MoE).","release_date":"2026-06-04","context_window":1000000,"max_output_tokens":65536,"parameters":550,"active_parameters":55,"model_type":"chat","tagline":"NVIDIA Nemotron 3 Ultra is an open frontier-reasoning and orchestration model from NVIDIA, with 55B active parameters out of 550B total (MoE).","capabilities":{"tool_call":true,"reasoning":true},"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-06-10"},{"id":"nvidia/nemotron-3-ultra-550b-a55b","name":"NVIDIA: Nemotron 3 Ultra","created_by":"nvidia","source":"official","description":"NVIDIA Nemotron 3 Ultra is an open frontier-reasoning and orchestration model from NVIDIA, with 55B active parameters out of 550B total (MoE).","release_date":"2026-06-04","context_window":1000000,"max_output_tokens":16384,"parameters":550,"active_parameters":55,"model_type":"chat","tagline":"NVIDIA Nemotron 3 Ultra is an open frontier-reasoning and orchestration model from NVIDIA, with 55B active parameters out of 550B total (MoE).","capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.5,"output":2.2,"cached_input":0.1},"tools":["function_calling"],"last_updated":"2026-06-18"},{"id":"nvidia/nemotron-3.5-content-safety:free","name":"NVIDIA: Nemotron 3.5 Content Safety (free)","created_by":"nvidia","source":"official","description":"NVIDIA Nemotron 3.5 Content Safety is a compact 4B-parameter multimodal guardrail model from NVIDIA, fine-tuned from Google 
Gemma-3-4B.","release_date":"2026-06-04","context_window":128000,"max_output_tokens":8192,"model_type":"chat","tagline":"NVIDIA Nemotron 3.5 Content Safety is a compact 4B-parameter multimodal guardrail model from NVIDIA, fine-tuned from Google Gemma-3-4B.","capabilities":{"reasoning":true},"modalities":{"input":["text","image"],"output":["text"]},"last_updated":"2026-06-10"},{"id":"nvidia/nemotron-nano-12b-v2-vl:free","name":"NVIDIA: Nemotron Nano 12B 2 VL (free)","created_by":"nvidia","source":"official","last_updated":"2026-03-23","description":"NVIDIA Nemotron Nano 2 VL is a 12-billion-parameter open multimodal reasoning model designed for video understanding and document intelligence.","context_window":128000,"max_output_tokens":128000,"modalities":{"input":["image","text","video"],"output":["text"]},"capabilities":{"tool_call":true,"reasoning":true},"model_type":"chat","parameters":12,"release_date":"2025-10-28","tagline":"NVIDIA Nemotron Nano 2 VL is a 12-billion-parameter open multimodal reasoning model designed for video understanding and document intelligence.","tools":["function_calling"]},{"id":"nvidia/nemotron-nano-12b-v2-vl","name":"NVIDIA: Nemotron Nano 12B 2 VL","created_by":"nvidia","source":"official","last_updated":"2026-05-01","description":"NVIDIA Nemotron Nano 2 VL is a 12-billion-parameter open multimodal reasoning model designed for video understanding and document intelligence.","context_window":131072,"modalities":{"input":["image","text","video"],"output":["text"]},"capabilities":{"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":0.2,"output":0.6},"model_type":"chat","parameters":12,"release_date":"2025-10-28","tagline":"NVIDIA Nemotron Nano 2 VL is a 12-billion-parameter open multimodal reasoning model designed for video understanding and document intelligence.","max_output_tokens":16384,"status":"deprecated","deprecation_date":"2026-05-07"},{"id":"nvidia/nemotron-nano-9b-v2:free","name":"NVIDIA: Nemotron 
Nano 9B V2 (free)","created_by":"nvidia","source":"official","last_updated":"2026-03-24","description":"NVIDIA-Nemotron-Nano-9B-v2 is a large language model (LLM) trained from scratch by NVIDIA, and designed as a unified model for both reasoning and non-reasoning tasks.","context_window":128000,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"model_type":"chat","parameters":9,"release_date":"2025-09-05","tagline":"NVIDIA-Nemotron-Nano-9B-v2 is a large language model (LLM) trained from scratch by NVIDIA, and designed as a unified model for both reasoning and non-reasoning tasks.","tools":["function_calling"]},{"id":"nvidia/nemotron-nano-9b-v2","name":"NVIDIA: Nemotron Nano 9B V2","created_by":"nvidia","source":"official","last_updated":"2026-06-10","description":"NVIDIA-Nemotron-Nano-9B-v2 is a large language model (LLM) trained from scratch by NVIDIA, and designed as a unified model for both reasoning and non-reasoning tasks.","context_window":131072,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":0.04,"output":0.16},"model_type":"chat","parameters":9,"release_date":"2025-09-05","tagline":"NVIDIA-Nemotron-Nano-9B-v2 is a large language model (LLM) trained from scratch by NVIDIA, and designed as a unified model for both reasoning and non-reasoning tasks.","tools":["function_calling"],"max_output_tokens":16384,"status":"deprecated","deprecation_date":"2026-06-11"},{"id":"openai/gpt-3.5-turbo-0613","name":"OpenAI: GPT-3.5 Turbo (older v0613)","created_by":"openai","source":"official","last_updated":"2026-03-24","family":"gpt-3.5","description":"GPT-3.5 Turbo is OpenAI's fastest 
model.","context_window":4095,"max_output_tokens":4096,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"fine_tuning":true,"streaming":false,"vision":false,"reasoning":false,"batch":true},"pricing":{"input":1,"output":2},"model_type":"chat","release_date":"2024-01-25","tagline":"GPT-3.5 Turbo is OpenAI's fastest model.","tools":["function_calling"],"knowledge_cutoff":"2021-09","license":"proprietary","open_weight":false},{"id":"openai/gpt-3.5-turbo-16k","name":"OpenAI: GPT-3.5 Turbo 16k","created_by":"openai","source":"official","last_updated":"2026-03-24","family":"gpt-3.5","description":"This model offers four times the context length of gpt-3.5-turbo, allowing it to support approximately 20 pages of text in a single request at a higher cost.","context_window":16385,"max_output_tokens":4096,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true},"pricing":{"input":3,"output":4},"model_type":"chat","release_date":"2023-08-28","tagline":"This model offers four times the context length of gpt-3.5-turbo, allowing it to support approximately 20 pages of text in a single request at a higher cost.","tools":["function_calling"]},{"id":"openai/gpt-3.5-turbo-instruct","name":"OpenAI: GPT-3.5 Turbo Instruct","created_by":"openai","source":"official","last_updated":"2026-03-24","family":"gpt-3.5","description":"This model is a variant of GPT-3.5 Turbo tuned for instructional prompts and omitting chat-related optimizations.","context_window":4095,"max_output_tokens":4096,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"structured_output":true,"json_mode":true,"fine_tuning":true,"streaming":false,"vision":false,"tool_call":false,"reasoning":false},"pricing":{"input":1.5,"output":2},"model_type":"chat","release_date":"2023-09-28","tagline":"This model is a variant of GPT-3.5 Turbo tuned for instructional prompts and 
omitting chat-related optimizations.","knowledge_cutoff":"2021-09","license":"proprietary","open_weight":false},{"id":"openai/gpt-3.5-turbo","name":"OpenAI: GPT-3.5 Turbo","created_by":"openai","source":"official","last_updated":"2026-03-24","family":"gpt-3.5","description":"GPT-3.5 Turbo is OpenAI's fastest model.","context_window":16385,"max_output_tokens":4096,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"fine_tuning":true,"streaming":false,"vision":false,"reasoning":false,"batch":true},"pricing":{"input":0.5,"output":1.5},"model_type":"chat","release_date":"2023-05-28","tagline":"GPT-3.5 Turbo is OpenAI's fastest model.","tools":["function_calling"],"knowledge_cutoff":"2021-09","license":"proprietary","open_weight":false},{"id":"openai/gpt-4-0314","name":"OpenAI: GPT-4 (older v0314)","created_by":"openai","source":"official","last_updated":"2026-03-24","family":"gpt-4","description":"GPT-4-0314 is the first version of GPT-4 released, with a context length of 8,192 tokens, and was supported until June 14.","context_window":8191,"max_output_tokens":4096,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true},"pricing":{"input":30,"output":60},"model_type":"chat","release_date":"2023-05-28","tagline":"GPT-4-0314 is the first version of GPT-4 released, with a context length of 8,192 tokens, and was supported until June 14.","tools":["function_calling"]},{"id":"openai/gpt-4-1106-preview","name":"OpenAI: GPT-4 Turbo (older v1106)","created_by":"openai","source":"official","last_updated":"2026-03-24","family":"gpt-4","description":"The latest GPT-4 Turbo model with vision 
capabilities.","context_window":128000,"max_output_tokens":4096,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true},"pricing":{"input":10,"output":30},"model_type":"chat","release_date":"2023-11-06","tagline":"The latest GPT-4 Turbo model with vision capabilities.","tools":["function_calling"]},{"id":"openai/gpt-4-turbo-preview","name":"OpenAI: GPT-4 Turbo Preview","created_by":"openai","source":"official","last_updated":"2026-03-24","family":"gpt-4-turbo","description":"The preview GPT-4 model with improved instruction following, JSON mode, reproducible outputs, parallel function calling, and more.","context_window":128000,"max_output_tokens":4096,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true},"pricing":{"input":10,"output":30},"model_type":"chat","release_date":"2024-01-25","tagline":"The preview GPT-4 model with improved instruction following, JSON mode, reproducible outputs, parallel function calling, and more.","tools":["function_calling"],"license":"proprietary","open_weight":false},{"id":"openai/gpt-4-turbo","name":"OpenAI: GPT-4 Turbo","created_by":"openai","source":"official","last_updated":"2026-03-24","family":"gpt-4-turbo","description":"The latest GPT-4 Turbo model with vision capabilities.","context_window":128000,"max_output_tokens":4096,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"vision":true,"fine_tuning":false,"reasoning":false,"batch":true},"pricing":{"input":10,"output":30},"model_type":"chat","release_date":"2024-04-09","tagline":"The latest GPT-4 Turbo model with vision capabilities.","tools":["function_calling"],"knowledge_cutoff":"2023-12","license":"proprietary","open_weight":false},{"id":"openai/gpt-4.1-mini","name":"OpenAI: GPT-4.1 
Mini","created_by":"openai","source":"official","last_updated":"2026-03-24","family":"gpt-4.1","description":"GPT-4.1 Mini is a mid-sized model delivering performance competitive with GPT-4o at substantially lower latency and cost.","context_window":1047576,"max_output_tokens":32768,"modalities":{"input":["image","text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"vision":true,"fine_tuning":true,"reasoning":false,"batch":true},"pricing":{"input":0.4,"output":1.6,"cached_input":0.1},"model_type":"chat","release_date":"2025-04-14","tagline":"GPT-4.1 Mini is a mid-sized model delivering performance competitive with GPT-4o at substantially lower latency and cost.","tools":["function_calling"],"knowledge_cutoff":"2024-06","license":"proprietary","open_weight":false},{"id":"openai/gpt-4.1-nano","name":"OpenAI: GPT-4.1 Nano","created_by":"openai","source":"official","last_updated":"2026-03-24","family":"gpt-4.1","description":"For tasks that demand low latency, GPT‑4.1 nano is the fastest and cheapest model in the GPT-4.1 series.","context_window":1047576,"max_output_tokens":32768,"modalities":{"input":["image","text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"vision":true,"fine_tuning":true,"reasoning":false,"batch":true},"pricing":{"input":0.1,"output":0.4,"cached_input":0.025},"model_type":"chat","release_date":"2025-04-14","tagline":"For tasks that demand low latency, GPT‑4.1 nano is the fastest and cheapest model in the GPT-4.1 series.","tools":["function_calling"],"knowledge_cutoff":"2024-06","license":"proprietary","open_weight":false},{"id":"openai/gpt-4.1","name":"OpenAI: GPT-4.1","created_by":"openai","source":"official","last_updated":"2026-03-24","family":"gpt-4.1","description":"GPT-4.1 is a flagship large language model optimized for advanced instruction following, real-world software engineering, and long-context 
reasoning.","context_window":1047576,"max_output_tokens":32768,"modalities":{"input":["image","text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"vision":true,"fine_tuning":true,"reasoning":false,"batch":true},"pricing":{"input":2,"output":8,"cached_input":0.5},"model_type":"chat","release_date":"2025-04-14","tagline":"GPT-4.1 is a flagship large language model optimized for advanced instruction following, real-world software engineering, and long-context reasoning.","tools":["function_calling"],"knowledge_cutoff":"2024-06","license":"proprietary","open_weight":false},{"id":"openai/gpt-4","name":"OpenAI: GPT-4","created_by":"openai","source":"official","last_updated":"2026-04-07","family":"gpt-4","description":"OpenAI's flagship model, GPT-4 is a large-scale multimodal language model capable of solving difficult problems with greater accuracy than previous models due to its broader general knowledge and adva","context_window":8191,"max_output_tokens":4096,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"fine_tuning":true,"vision":false,"reasoning":false,"batch":true},"pricing":{"input":30,"output":60},"model_type":"chat","release_date":"2023-05-28","tagline":"OpenAI's flagship model, GPT-4 is a large-scale multimodal language model capable of solving difficult problems with greater accuracy than previous models due to its broader general knowledge and adva","tools":["function_calling"],"knowledge_cutoff":"2023-12","license":"proprietary","open_weight":false},{"id":"openai/gpt-4o-2024-05-13","name":"OpenAI: GPT-4o (2024-05-13)","created_by":"openai","source":"official","last_updated":"2026-03-24","family":"gpt-4o","description":"GPT-4o (\"o\" for \"omni\") is OpenAI's latest AI model, supporting both text and image inputs with text 
outputs.","context_window":128000,"max_output_tokens":4096,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"vision":true,"fine_tuning":true,"reasoning":false,"batch":true},"pricing":{"input":5,"output":15,"cached_input":1.25},"model_type":"chat","release_date":"2024-05-13","alias":"openai/gpt-4o","tagline":"GPT-4o (\"o\" for \"omni\") is OpenAI's latest AI model, supporting both text and image inputs with text outputs.","tools":["function_calling"],"knowledge_cutoff":"2023-10","license":"proprietary","open_weight":false},{"id":"openai/gpt-4o-2024-08-06","name":"OpenAI: GPT-4o (2024-08-06)","created_by":"openai","source":"official","last_updated":"2026-03-24","family":"gpt-4o","description":"The 2024-08-06 version of GPT-4o offers improved performance in structured outputs, with the ability to supply a JSON schema in the respone_format.","context_window":128000,"max_output_tokens":16384,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"vision":true,"fine_tuning":true,"reasoning":false,"batch":true},"pricing":{"input":2.5,"output":10,"cached_input":1.25},"model_type":"chat","release_date":"2024-08-06","alias":"openai/gpt-4o","tagline":"The 2024-08-06 version of GPT-4o offers improved performance in structured outputs, with the ability to supply a JSON schema in the respone_format.","tools":["function_calling"],"knowledge_cutoff":"2023-10","license":"proprietary","open_weight":false},{"id":"openai/gpt-4o-2024-11-20","name":"OpenAI: GPT-4o (2024-11-20)","created_by":"openai","source":"official","last_updated":"2026-03-24","family":"gpt-4o","description":"The 2024-11-20 version of GPT-4o offers a leveled-up creative writing ability with more natural, engaging, and tailored writing to improve relevance & 
readability.","context_window":128000,"max_output_tokens":16384,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"vision":true,"fine_tuning":false,"reasoning":false,"batch":true},"pricing":{"input":2.5,"output":10,"cached_input":1.25},"model_type":"chat","release_date":"2024-11-20","alias":"openai/gpt-4o","tagline":"The 2024-11-20 version of GPT-4o offers a leveled-up creative writing ability with more natural, engaging, and tailored writing to improve relevance & readability.","tools":["function_calling"],"knowledge_cutoff":"2023-10","license":"proprietary","open_weight":false},{"id":"openai/gpt-4o-audio-preview","name":"OpenAI: GPT-4o Audio","created_by":"openai","source":"official","last_updated":"2026-03-24","family":"gpt-4o","description":"The gpt-4o-audio-preview model adds support for audio inputs as prompts.","context_window":128000,"max_output_tokens":16384,"modalities":{"input":["audio","text"],"output":["text","audio"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"vision":false,"fine_tuning":false,"reasoning":false},"pricing":{"input":2.5,"output":10},"model_type":"chat","release_date":"2025-08-15","tagline":"The gpt-4o-audio-preview model adds support for audio inputs as prompts.","tools":["function_calling"],"knowledge_cutoff":"2023-10","license":"proprietary","open_weight":false},{"id":"openai/gpt-4o:extended","name":"OpenAI: GPT-4o (extended)","created_by":"openai","source":"official","last_updated":"2026-03-24","family":"gpt-4o","description":"GPT-4o (\"o\" for \"omni\") is OpenAI's latest AI model, supporting both text and image inputs with text 
outputs.","context_window":128000,"max_output_tokens":64000,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true},"pricing":{"input":6,"output":18},"model_type":"chat","release_date":"2024-05-13","tagline":"GPT-4o (\"o\" for \"omni\") is OpenAI's latest AI model, supporting both text and image inputs with text outputs.","tools":["function_calling"]},{"id":"openai/gpt-4o-mini-2024-07-18","name":"OpenAI: GPT-4o-mini (2024-07-18)","created_by":"openai","source":"official","last_updated":"2026-03-24","family":"gpt-4o","description":"GPT-4o mini is OpenAI's newest model after [GPT-4 Omni](/models/openai/gpt-4o), supporting both text and image inputs with text outputs.","context_window":128000,"max_output_tokens":16384,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"vision":true,"fine_tuning":true,"reasoning":false,"batch":true},"pricing":{"input":0.15,"output":0.6,"cached_input":0.075},"model_type":"chat","release_date":"2024-07-18","alias":"openai/gpt-4o-mini","tagline":"GPT-4o mini is OpenAI's newest model after [GPT-4 Omni](/models/openai/gpt-4o), supporting both text and image inputs with text outputs.","tools":["function_calling"],"knowledge_cutoff":"2023-10","license":"proprietary","open_weight":false},{"id":"openai/gpt-4o-mini-search-preview","name":"OpenAI: GPT-4o-mini Search Preview","created_by":"openai","source":"official","last_updated":"2026-03-24","family":"gpt-4o","description":"GPT-4o mini Search Preview is a specialized model for web search in Chat 
Completions.","context_window":128000,"max_output_tokens":16384,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"structured_output":true,"json_mode":true,"streaming":true,"vision":true,"tool_call":false,"fine_tuning":false,"reasoning":false},"pricing":{"input":0.15,"output":0.6},"model_type":"chat","release_date":"2025-03-12","tagline":"GPT-4o mini Search Preview is a specialized model for web search in Chat Completions.","knowledge_cutoff":"2023-10","license":"proprietary","open_weight":false},{"id":"openai/gpt-4o-mini","name":"OpenAI: GPT-4o-mini (2024-07-18)","created_by":"openai","source":"official","last_updated":"2026-06-29","family":"gpt-4o","description":"GPT-4o mini is OpenAI's newest model after [GPT-4 Omni](/models/openai/gpt-4o), supporting both text and image inputs with text outputs.","context_window":128000,"max_output_tokens":16384,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"vision":true,"fine_tuning":true,"reasoning":false,"batch":true},"pricing":{"input":0.15,"output":0.6,"cached_input":0.075},"model_type":"chat","release_date":"2024-07-18","tagline":"GPT-4o mini is OpenAI's newest model after [GPT-4 Omni](/models/openai/gpt-4o), supporting both text and image inputs with text outputs.","tools":["function_calling"],"snapshots":["openai/gpt-4o-mini-2024-07-18"],"knowledge_cutoff":"2023-10","license":"proprietary","open_weight":false},{"id":"openai/gpt-4o-search-preview","name":"OpenAI: GPT-4o Search Preview","created_by":"openai","source":"official","last_updated":"2026-03-24","family":"gpt-4o","description":"GPT-4o Search Previewis a specialized model for web search in Chat 
Completions.","context_window":128000,"max_output_tokens":16384,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"structured_output":true,"json_mode":true,"streaming":true,"vision":true,"tool_call":false,"fine_tuning":false,"reasoning":false},"pricing":{"input":2.5,"output":10},"model_type":"chat","release_date":"2025-03-12","tagline":"GPT-4o Search Previewis a specialized model for web search in Chat Completions.","knowledge_cutoff":"2023-10","license":"proprietary","open_weight":false},{"id":"openai/gpt-4o","name":"OpenAI: GPT-4o","created_by":"openai","source":"official","last_updated":"2026-06-03","family":"gpt-4o","description":"GPT-4o (\"o\" for \"omni\") is OpenAI's latest AI model, supporting both text and image inputs with text outputs.","context_window":128000,"max_output_tokens":16384,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"vision":true,"fine_tuning":false,"reasoning":false,"batch":true},"pricing":{"input":2.5,"output":10,"cached_input":1.25},"model_type":"chat","release_date":"2024-05-13","tagline":"The 2024-11-20 version of GPT-4o offers a leveled-up creative writing ability with more natural, engaging, and tailored writing to improve relevance & readability.","tools":["function_calling"],"snapshots":["openai/gpt-4o-2024-11-20","openai/gpt-4o-2024-08-06","openai/gpt-4o-2024-05-13"],"knowledge_cutoff":"2023-10","license":"proprietary","open_weight":false},{"id":"openai/gpt-5-chat","name":"OpenAI: GPT-5 Chat","created_by":"openai","source":"official","last_updated":"2026-03-24","family":"gpt-5","description":"GPT-5 Chat is designed for advanced, natural, multimodal, and context-aware conversations for enterprise 
applications.","context_window":128000,"max_output_tokens":16384,"modalities":{"input":["image","text"],"output":["text"]},"capabilities":{"structured_output":true,"json_mode":true},"pricing":{"input":1.25,"output":10,"cached_input":0.125},"model_type":"chat","release_date":"2025-08-07","tagline":"GPT-5 Chat is designed for advanced, natural, multimodal, and context-aware conversations for enterprise applications."},{"id":"openai/gpt-5-codex","name":"OpenAI: GPT-5 Codex","created_by":"openai","source":"official","last_updated":"2026-03-24","family":"gpt-5","description":"GPT-5-Codex is a specialized version of GPT-5 optimized for software engineering and coding workflows.","context_window":400000,"max_output_tokens":128000,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"vision":true,"fine_tuning":false},"pricing":{"input":1.25,"output":10,"cached_input":0.125},"model_type":"chat","release_date":"2025-09-23","tagline":"GPT-5-Codex is a specialized version of GPT-5 optimized for software engineering and coding workflows.","tools":["function_calling"],"max_input_tokens":272000,"knowledge_cutoff":"2024-09","license":"proprietary","open_weight":false},{"id":"openai/gpt-5-image-mini","name":"OpenAI: GPT-5 Image Mini","created_by":"openai","source":"official","last_updated":"2026-03-24","family":"gpt-5","description":"GPT-5 Image Mini combines OpenAI's advanced language capabilities, powered by [GPT-5 Mini](https://openrouter.ai/openai/gpt-5-mini), with GPT Image 1 Mini for efficient image generation.","context_window":400000,"max_output_tokens":128000,"modalities":{"input":["image","text"],"output":["image","text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":2.5,"output":2,"cached_input":0.25},"model_type":"chat","release_date":"2025-10-16","tagline":"GPT-5 Image Mini combines OpenAI's 
advanced language capabilities, powered by [GPT-5 Mini](https://openrouter.ai/openai/gpt-5-mini), with GPT Image 1 Mini for efficient image generation.","tools":["function_calling"]},{"id":"openai/gpt-5-image","name":"OpenAI: GPT-5 Image","created_by":"openai","source":"official","last_updated":"2026-03-24","family":"gpt-5","description":"[GPT-5](https://openrouter.ai/openai/gpt-5) Image combines OpenAI's GPT-5 model with state-of-the-art image generation capabilities.","context_window":400000,"max_output_tokens":128000,"modalities":{"input":["image","text"],"output":["image","text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":10,"output":10,"cached_input":1.25},"model_type":"chat","release_date":"2025-10-14","tagline":"[GPT-5](https://openrouter.ai/openai/gpt-5) Image combines OpenAI's GPT-5 model with state-of-the-art image generation capabilities.","tools":["function_calling"]},{"id":"openai/gpt-5-mini","name":"OpenAI: GPT-5 Mini","created_by":"openai","source":"official","last_updated":"2026-03-24","family":"gpt-5","description":"GPT-5 Mini is a compact version of GPT-5, designed to handle lighter-weight reasoning tasks.","context_window":400000,"max_output_tokens":128000,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"vision":true,"fine_tuning":false,"batch":true},"pricing":{"input":0.25,"output":2,"cached_input":0.025},"model_type":"chat","release_date":"2025-08-07","tagline":"GPT-5 Mini is a compact version of GPT-5, designed to handle lighter-weight reasoning tasks.","tools":["function_calling"],"max_input_tokens":272000,"knowledge_cutoff":"2024-05","license":"proprietary","open_weight":false},{"id":"openai/gpt-5-nano","name":"OpenAI: GPT-5 Nano","created_by":"openai","source":"official","last_updated":"2026-04-12","family":"gpt-5","description":"GPT-5-Nano is the 
smallest and fastest variant in the GPT-5 system, optimized for developer tools, rapid interactions, and ultra-low latency environments.","context_window":400000,"max_output_tokens":128000,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"vision":true,"fine_tuning":false,"batch":true},"pricing":{"input":0.05,"output":0.4,"cached_input":0.01},"model_type":"chat","release_date":"2025-08-07","tagline":"GPT-5-Nano is the smallest and fastest variant in the GPT-5 system, optimized for developer tools, rapid interactions, and ultra-low latency environments.","tools":["function_calling"],"max_input_tokens":272000,"knowledge_cutoff":"2024-05","license":"proprietary","open_weight":false},{"id":"openai/gpt-5-pro","name":"OpenAI: GPT-5 Pro","created_by":"openai","source":"official","last_updated":"2026-03-24","family":"gpt-5","description":"GPT-5 Pro is OpenAI’s most advanced model, offering major improvements in reasoning, code quality, and user experience.","context_window":400000,"max_output_tokens":128000,"modalities":{"input":["image","text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"vision":true,"fine_tuning":false,"batch":true},"pricing":{"input":15,"output":120},"model_type":"chat","release_date":"2025-10-06","tagline":"GPT-5 Pro is OpenAI’s most advanced model, offering major improvements in reasoning, code quality, and user experience.","tools":["function_calling"],"knowledge_cutoff":"2024-09","license":"proprietary","open_weight":false},{"id":"openai/gpt-5.1-chat","name":"OpenAI: GPT-5.1 Chat","created_by":"openai","source":"official","last_updated":"2026-05-29","family":"gpt-5.1","description":"GPT-5.1 Chat (AKA Instant is the fast, lightweight member of the 5.1 family, optimized for low-latency chat while retaining strong general 
intelligence.","context_window":128000,"max_output_tokens":32000,"modalities":{"input":["image","text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true},"pricing":{"input":1.25,"output":10,"cached_input":0.13},"model_type":"chat","release_date":"2025-11-13","tagline":"GPT-5.1 Chat (AKA Instant is the fast, lightweight member of the 5.1 family, optimized for low-latency chat while retaining strong general intelligence.","tools":["function_calling"]},{"id":"openai/gpt-5.1-codex-max","name":"OpenAI: GPT-5.1-Codex-Max","created_by":"openai","source":"official","last_updated":"2026-03-24","family":"gpt-5.1","description":"GPT-5.1-Codex-Max is OpenAI’s latest agentic coding model, designed for long-running, high-context software development tasks.","context_window":400000,"max_output_tokens":128000,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"vision":true,"fine_tuning":false},"pricing":{"input":1.25,"output":10,"cached_input":0.125},"model_type":"chat","release_date":"2025-12-04","tagline":"GPT-5.1-Codex-Max is OpenAI’s latest agentic coding model, designed for long-running, high-context software development tasks.","tools":["function_calling"],"knowledge_cutoff":"2024-09","license":"proprietary","open_weight":false},{"id":"openai/gpt-5.1-codex-mini","name":"OpenAI: GPT-5.1-Codex-Mini","created_by":"openai","source":"official","last_updated":"2026-05-29","family":"gpt-5.1","description":"GPT-5.1-Codex-Mini is a smaller and faster version of 
GPT-5.1-Codex","context_window":400000,"max_output_tokens":100000,"modalities":{"input":["image","text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"vision":true,"fine_tuning":false},"pricing":{"input":0.25,"output":2,"cached_input":0.025},"model_type":"chat","release_date":"2025-11-13","tagline":"GPT-5.1-Codex-Mini is a smaller and faster version of GPT-5.1-Codex","tools":["function_calling"],"knowledge_cutoff":"2024-09","license":"proprietary","open_weight":false},{"id":"openai/gpt-5.1-codex","name":"OpenAI: GPT-5.1-Codex","created_by":"openai","source":"official","last_updated":"2026-05-29","family":"gpt-5.1","description":"GPT-5.1-Codex is a specialized version of GPT-5.1 optimized for software engineering and coding workflows.","context_window":400000,"max_output_tokens":128000,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"vision":true,"fine_tuning":false},"pricing":{"input":1.25,"output":10,"cached_input":0.13},"model_type":"chat","release_date":"2025-11-13","tagline":"GPT-5.1-Codex is a specialized version of GPT-5.1 optimized for software engineering and coding workflows.","tools":["function_calling"],"knowledge_cutoff":"2024-09","license":"proprietary","open_weight":false},{"id":"openai/gpt-5.1","name":"OpenAI: GPT-5.1","created_by":"openai","source":"official","last_updated":"2026-04-12","family":"gpt-5.1","description":"GPT-5.1 is the latest frontier-grade model in the GPT-5 series, offering stronger general-purpose reasoning, improved instruction adherence, and a more natural conversational style compared to 
GPT-5.","context_window":400000,"max_output_tokens":128000,"modalities":{"input":["image","text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"vision":true,"fine_tuning":false,"batch":true},"pricing":{"input":1.25,"output":10,"cached_input":0.13},"model_type":"chat","release_date":"2025-11-13","tagline":"GPT-5.1 is the latest frontier-grade model in the GPT-5 series, offering stronger general-purpose reasoning, improved instruction adherence, and a more natural conversational style compared to GPT-5.","tools":["function_calling"],"knowledge_cutoff":"2024-09","license":"proprietary","open_weight":false},{"id":"openai/gpt-5.2-chat","name":"OpenAI: GPT-5.2 Chat","created_by":"openai","source":"official","last_updated":"2026-05-29","family":"gpt-5.2","description":"GPT-5.2 Chat (AKA Instant) is the fast, lightweight member of the 5.2 family, optimized for low-latency chat while retaining strong general intelligence.","context_window":128000,"max_output_tokens":16384,"modalities":{"input":["image","text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true},"pricing":{"input":1.75,"output":14,"cached_input":0.175},"model_type":"chat","release_date":"2025-12-10","tagline":"GPT-5.2 Chat (AKA Instant) is the fast, lightweight member of the 5.2 family, optimized for low-latency chat while retaining strong general intelligence.","tools":["function_calling"],"status":"deprecated","deprecation_date":"2026-08-10"},{"id":"openai/gpt-5.2-codex","name":"OpenAI: GPT-5.2-Codex","created_by":"openai","source":"official","last_updated":"2026-03-24","family":"gpt-5.2","description":"GPT-5.2-Codex is an upgraded version of GPT-5.1-Codex optimized for software engineering and coding 
workflows.","context_window":400000,"max_output_tokens":128000,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"vision":true,"fine_tuning":false},"pricing":{"input":1.75,"output":14,"cached_input":0.175},"model_type":"chat","release_date":"2026-01-14","tagline":"GPT-5.2-Codex is an upgraded version of GPT-5.1-Codex optimized for software engineering and coding workflows.","tools":["function_calling"],"max_input_tokens":272000,"knowledge_cutoff":"2025-08","license":"proprietary","open_weight":false},{"id":"openai/gpt-5.2-pro","name":"OpenAI: GPT-5.2 Pro","created_by":"openai","source":"official","last_updated":"2026-03-24","family":"gpt-5.2","description":"GPT-5.2 Pro is OpenAI’s most advanced model, offering major improvements in agentic coding and long context performance over GPT-5 Pro.","context_window":400000,"max_output_tokens":128000,"modalities":{"input":["image","text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"vision":true,"fine_tuning":false},"pricing":{"input":21,"output":168},"model_type":"chat","release_date":"2025-12-10","tagline":"GPT-5.2 Pro is OpenAI’s most advanced model, offering major improvements in agentic coding and long context performance over GPT-5 Pro.","tools":["function_calling"],"knowledge_cutoff":"2025-08","license":"proprietary","open_weight":false},{"id":"openai/gpt-5.2","name":"OpenAI: GPT-5.2","created_by":"openai","source":"official","last_updated":"2026-03-24","family":"gpt-5.2","description":"GPT-5.2 is the latest frontier-grade model in the GPT-5 series, offering stronger agentic and long context perfomance compared to 
GPT-5.1.","context_window":400000,"max_output_tokens":128000,"modalities":{"input":["image","text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"vision":true,"fine_tuning":false,"batch":true},"pricing":{"input":1.75,"output":14,"cached_input":0.175},"model_type":"chat","release_date":"2025-12-10","tagline":"GPT-5.2 is the latest frontier-grade model in the GPT-5 series, offering stronger agentic and long context perfomance compared to GPT-5.1.","tools":["function_calling"],"knowledge_cutoff":"2025-08","license":"proprietary","open_weight":false},{"id":"openai/gpt-5.3-chat","name":"OpenAI: GPT-5.3 Chat","created_by":"openai","source":"official","last_updated":"2026-03-24","family":"gpt-5.3","description":"GPT-5.3 Chat is an update to ChatGPT's most-used model that makes everyday conversations smoother, more useful, and more directly helpful.","context_window":128000,"max_output_tokens":16384,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true},"pricing":{"input":1.75,"output":14,"cached_input":0.175},"model_type":"chat","release_date":"2026-03-03","tagline":"GPT-5.3 Chat is an update to ChatGPT's most-used model that makes everyday conversations smoother, more useful, and more directly helpful.","tools":["function_calling"]},{"id":"openai/gpt-5.3-codex","name":"OpenAI: GPT-5.3-Codex","created_by":"openai","source":"official","last_updated":"2026-03-24","family":"gpt-5.3","description":"GPT-5.3-Codex is OpenAI’s most advanced agentic coding model, combining the frontier software engineering performance of GPT-5.2-Codex with the broader reasoning and professional knowledge capabilities of 
GPT-5.2.","context_window":400000,"max_output_tokens":128000,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"vision":true,"fine_tuning":false},"pricing":{"input":1.75,"output":14,"cached_input":0.175},"model_type":"chat","release_date":"2026-02-24","tagline":"GPT-5.3-Codex is OpenAI’s most advanced agentic coding model, combining the frontier software engineering performance of GPT-5.2-Codex with the broader reasoning and professional knowledge capabilitie","tools":["function_calling"],"max_input_tokens":272000,"knowledge_cutoff":"2025-08","license":"proprietary","open_weight":false},{"id":"openai/gpt-5.4-image-2","name":"OpenAI: GPT-5.4 Image 2","created_by":"openai","source":"official","family":"gpt-5.4","description":"[GPT-5.4](https://openrouter.ai/openai/gpt-5.4) Image 2 combines OpenAI's GPT-5.4 model with state-of-the-art image generation capabilities from GPT Image 2.","release_date":"2026-04-21","context_window":272000,"max_output_tokens":128000,"model_type":"chat","tagline":"[GPT-5.4](https://openrouter.ai/openai/gpt-5.4) Image 2 combines OpenAI's GPT-5.4 model with state-of-the-art image generation capabilities from GPT Image 2.","capabilities":{"structured_output":true,"reasoning":true,"json_mode":true},"modalities":{"input":["image","text"],"output":["image","text"]},"pricing":{"input":8,"output":15,"cached_input":2},"last_updated":"2026-04-22"},{"id":"openai/gpt-5.4-mini","name":"OpenAI: GPT-5.4 Mini","created_by":"openai","source":"official","last_updated":"2026-03-24","family":"gpt-5.4","description":"GPT-5.4 mini brings the core capabilities of GPT-5.4 to a faster, more efficient model optimized for high-throughput 
workloads.","context_window":400000,"max_output_tokens":128000,"modalities":{"input":["image","text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"vision":true,"fine_tuning":false,"batch":true},"pricing":{"input":0.75,"output":4.5,"cached_input":0.075},"model_type":"chat","release_date":"2026-03-17","tagline":"GPT-5.4 mini brings the core capabilities of GPT-5.4 to a faster, more efficient model optimized for high-throughput workloads.","tools":["function_calling"],"max_input_tokens":272000,"knowledge_cutoff":"2025-08","license":"proprietary","open_weight":false},{"id":"openai/gpt-5.4-nano","name":"OpenAI: GPT-5.4 Nano","created_by":"openai","source":"official","last_updated":"2026-03-24","family":"gpt-5.4","description":"GPT-5.4 nano is the most lightweight and cost-efficient variant of the GPT-5.4 family, optimized for speed-critical and high-volume tasks.","context_window":400000,"max_output_tokens":128000,"modalities":{"input":["image","text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"vision":true,"fine_tuning":false,"batch":true},"pricing":{"input":0.2,"output":1.25,"cached_input":0.02},"model_type":"chat","release_date":"2026-03-17","tagline":"GPT-5.4 nano is the most lightweight and cost-efficient variant of the GPT-5.4 family, optimized for speed-critical and high-volume tasks.","tools":["function_calling"],"max_input_tokens":272000,"knowledge_cutoff":"2025-08","license":"proprietary","open_weight":false},{"id":"openai/gpt-5.4-pro","name":"OpenAI: GPT-5.4 Pro","created_by":"openai","source":"official","last_updated":"2026-03-24","family":"gpt-5.4","description":"GPT-5.4 Pro is OpenAI's most advanced model, building on GPT-5.4's unified architecture with enhanced reasoning capabilities for complex, high-stakes 
tasks.","context_window":1050000,"max_output_tokens":128000,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"vision":true,"fine_tuning":false},"pricing":{"input":30,"output":180},"model_type":"chat","release_date":"2026-03-05","tagline":"GPT-5.4 Pro is OpenAI's most advanced model, building on GPT-5.4's unified architecture with enhanced reasoning capabilities for complex, high-stakes tasks.","tools":["function_calling"],"knowledge_cutoff":"2025-08","license":"proprietary","open_weight":false},{"id":"openai/gpt-5.4","name":"OpenAI: GPT-5.4","created_by":"openai","source":"official","last_updated":"2026-03-24","family":"gpt-5.4","description":"GPT-5.4 is OpenAI’s latest frontier model, unifying the Codex and GPT lines into a single system.","context_window":1050000,"max_output_tokens":128000,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"vision":true,"fine_tuning":false,"batch":true},"pricing":{"input":2.5,"output":15,"cached_input":0.25},"model_type":"chat","release_date":"2026-03-05","tagline":"GPT-5.4 is OpenAI’s latest frontier model, unifying the Codex and GPT lines into a single system.","tools":["function_calling"],"knowledge_cutoff":"2025-08","license":"proprietary","open_weight":false},{"id":"openai/gpt-5.5-pro","name":"OpenAI: GPT-5.5 Pro","created_by":"openai","source":"official","family":"gpt-5.5","description":"GPT-5.5 Pro is OpenAI’s high-capability model optimized for deep reasoning and accuracy on complex, high-stakes workloads.","release_date":"2026-04-24","context_window":1050000,"max_output_tokens":128000,"model_type":"chat","tagline":"GPT-5.5 Pro is OpenAI’s high-capability model optimized for deep reasoning and accuracy on complex, high-stakes 
workloads.","capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":false,"vision":true,"fine_tuning":false,"batch":true},"modalities":{"input":["image","text"],"output":["text"]},"pricing":{"input":30,"output":180},"tools":["function_calling"],"last_updated":"2026-04-25","knowledge_cutoff":"2025-12","license":"proprietary","open_weight":false},{"id":"openai/gpt-5.5","name":"OpenAI: GPT-5.5","created_by":"openai","source":"official","family":"gpt-5.5","description":"GPT-5.5 is OpenAI’s frontier model designed for complex professional workloads, building on GPT-5.4 with stronger reasoning, higher reliability, and improved token efficiency on hard tasks.","release_date":"2026-04-24","context_window":1050000,"max_output_tokens":128000,"model_type":"chat","tagline":"GPT-5.5 is OpenAI’s frontier model designed for complex professional workloads, building on GPT-5.4 with stronger reasoning, higher reliability, and improved token efficiency on hard tasks.","capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"vision":true,"fine_tuning":false,"batch":true},"modalities":{"input":["image","text"],"output":["text"]},"pricing":{"input":5,"output":30,"cached_input":0.5},"tools":["function_calling"],"last_updated":"2026-04-25","knowledge_cutoff":"2025-12","license":"proprietary","open_weight":false},{"id":"openai/gpt-5","name":"OpenAI: GPT-5","created_by":"openai","source":"official","last_updated":"2026-03-24","family":"gpt-5","description":"GPT-5 is OpenAI’s most advanced model, offering major improvements in reasoning, code quality, and user 
experience.","context_window":400000,"max_output_tokens":128000,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"vision":true,"fine_tuning":false,"batch":true},"pricing":{"input":1.25,"output":10,"cached_input":0.125},"model_type":"chat","release_date":"2025-08-07","tagline":"GPT-5 is OpenAI’s most advanced model, offering major improvements in reasoning, code quality, and user experience.","tools":["function_calling"],"max_input_tokens":272000,"knowledge_cutoff":"2024-09","license":"proprietary","open_weight":false},{"id":"openai/gpt-audio-mini","name":"OpenAI: GPT Audio Mini","created_by":"openai","source":"official","last_updated":"2026-04-01","family":"gpt-audio","description":"A cost-efficient version of GPT Audio.","context_window":128000,"max_output_tokens":16384,"modalities":{"input":["text","audio"],"output":["text","audio"]},"capabilities":{"structured_output":true,"json_mode":true,"tool_call":true,"streaming":false,"vision":false,"fine_tuning":false,"reasoning":false},"pricing":{"input":0.6,"output":2.4},"release_date":"2026-01-19","tagline":"A cost-efficient version of GPT Audio.","model_type":"chat","tools":["function_calling"],"knowledge_cutoff":"2023-10","license":"proprietary","open_weight":false},{"id":"openai/gpt-audio","name":"OpenAI: GPT Audio","created_by":"openai","source":"official","last_updated":"2026-04-01","family":"gpt-audio","description":"The gpt-audio model is OpenAI's first generally available audio model.","context_window":128000,"max_output_tokens":16384,"modalities":{"input":["text","audio"],"output":["text","audio"]},"capabilities":{"structured_output":true,"json_mode":true,"tool_call":true,"streaming":true,"vision":false,"fine_tuning":false,"reasoning":false},"pricing":{"input":2.5,"output":10},"release_date":"2026-01-19","tagline":"The gpt-audio model is OpenAI's first generally available audio 
model.","model_type":"chat","tools":["function_calling"],"knowledge_cutoff":"2023-10","license":"proprietary","open_weight":false},{"id":"openai/gpt-chat-latest","name":"OpenAI: GPT Chat Latest","created_by":"openai","source":"official","description":"GPT Chat Latest points to OpenAI's stable API alias `chat-latest` that always resolves to the latest Instant chat model used in ChatGPT.","release_date":"2026-05-05","context_window":400000,"max_output_tokens":128000,"tagline":"GPT Chat Latest points to OpenAI's stable API alias `chat-latest` that always resolves to the latest Instant chat model used in ChatGPT.","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":5,"output":30,"cached_input":0.5},"tools":["function_calling"],"last_updated":"2026-05-06"},{"id":"openai/gpt-oss-120b:free","name":"OpenAI: gpt-oss-120b (free)","created_by":"openai","source":"official","last_updated":"2026-03-23","family":"gpt-oss","description":"gpt-oss-120b is an open-weight, 117B-parameter Mixture-of-Experts (MoE) language model from OpenAI designed for high-reasoning, agentic, and general-purpose production use cases.","context_window":131072,"max_output_tokens":131072,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"reasoning":true},"model_type":"chat","release_date":"2025-08-05","tagline":"gpt-oss-120b is an open-weight, 117B-parameter Mixture-of-Experts (MoE) language model from OpenAI designed for high-reasoning, agentic, and general-purpose production use cases.","tools":["function_calling"]},{"id":"openai/gpt-oss-120b","name":"OpenAI: gpt-oss-120b","created_by":"openai","source":"official","last_updated":"2026-06-29","family":"gpt-oss","description":"gpt-oss-120b is an open-weight, 117B-parameter Mixture-of-Experts (MoE) language model from OpenAI designed for high-reasoning, agentic, and general-purpose production use 
cases.","context_window":131072,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"fine_tuning":false,"vision":false,"batch":true},"pricing":{"input":0.03,"output":0.15},"model_type":"chat","parameters":120,"release_date":"2025-08-05","tagline":"gpt-oss-120b is an open-weight, 117B-parameter Mixture-of-Experts (MoE) language model from OpenAI designed for high-reasoning, agentic, and general-purpose production use cases.","tools":["function_calling"],"max_output_tokens":131072,"knowledge_cutoff":"2024-06","license":"apache-2.0","open_weight":true},{"id":"openai/gpt-oss-20b:free","name":"OpenAI: gpt-oss-20b (free)","created_by":"openai","source":"official","last_updated":"2026-06-18","family":"gpt-oss","description":"gpt-oss-20b is an open-weight 21B parameter model released by OpenAI under the Apache 2.0 license.","context_window":131072,"max_output_tokens":32768,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"reasoning":true,"structured_output":true,"json_mode":true},"model_type":"chat","release_date":"2025-08-05","tagline":"gpt-oss-20b is an open-weight 21B parameter model released by OpenAI under the Apache 2.0 license.","tools":["function_calling"]},{"id":"openai/gpt-oss-20b","name":"OpenAI: gpt-oss-20b","created_by":"openai","source":"official","last_updated":"2026-06-02","family":"gpt-oss","description":"gpt-oss-20b is an open-weight 21B parameter model released by OpenAI under the Apache 2.0 license.","context_window":131072,"max_output_tokens":131072,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"fine_tuning":false,"vision":false,"batch":true},"pricing":{"input":0.029,"output":0.14,"cached_input":0.015},"model_type":"chat","parameters":20,"release_date":"2025-08-05","tagline":"gpt-oss-20b is an 
open-weight 21B parameter model released by OpenAI under the Apache 2.0 license.","tools":["function_calling"],"knowledge_cutoff":"2024-06","license":"apache-2.0","open_weight":true},{"id":"openai/gpt-oss-safeguard-20b","name":"OpenAI: gpt-oss-safeguard-20b","created_by":"openai","source":"official","last_updated":"2026-06-20","family":"gpt-oss","description":"gpt-oss-safeguard-20b is a safety reasoning model from OpenAI built upon gpt-oss-20b.","context_window":131072,"max_output_tokens":65536,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":0.075,"output":0.3,"cached_input":0.038},"model_type":"moderation","parameters":20,"release_date":"2025-10-29","tagline":"gpt-oss-safeguard-20b is a safety reasoning model from OpenAI built upon gpt-oss-20b.","tools":["function_calling"]},{"id":"openai/o1-pro","name":"OpenAI: o1-pro","created_by":"openai","source":"official","last_updated":"2026-03-24","family":"o1","description":"The o1 series of models are trained with reinforcement learning to think before they answer and perform complex reasoning.","context_window":200000,"max_output_tokens":100000,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"structured_output":true,"reasoning":true,"json_mode":true,"vision":true,"tool_call":true,"streaming":false,"fine_tuning":false,"batch":true},"pricing":{"input":150,"output":600},"model_type":"reasoning","release_date":"2025-03-19","tagline":"The o1 series of models are trained with reinforcement learning to think before they answer and perform complex reasoning.","knowledge_cutoff":"2023-10","license":"proprietary","open_weight":false},{"id":"openai/o1","name":"OpenAI: o1","created_by":"openai","source":"official","last_updated":"2026-03-24","family":"o1","description":"The latest and strongest model family from OpenAI, o1 is designed to spend more time thinking before 
responding.","context_window":200000,"max_output_tokens":100000,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"vision":true,"fine_tuning":false,"batch":true},"pricing":{"input":15,"output":60,"cached_input":7.5},"model_type":"reasoning","release_date":"2024-12-17","tagline":"The latest and strongest model family from OpenAI, o1 is designed to spend more time thinking before responding.","tools":["function_calling"],"knowledge_cutoff":"2023-10","license":"proprietary","open_weight":false},{"id":"openai/o3-deep-research","name":"OpenAI: o3 Deep Research","created_by":"openai","source":"official","last_updated":"2026-03-24","family":"o3","description":"o3-deep-research is OpenAI's advanced model for deep research, designed to tackle complex, multi-step research tasks.","context_window":200000,"max_output_tokens":100000,"modalities":{"input":["image","text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"vision":true,"fine_tuning":false,"batch":true},"pricing":{"input":10,"output":40,"cached_input":2.5},"model_type":"chat","release_date":"2025-10-10","tagline":"o3-deep-research is OpenAI's advanced model for deep research, designed to tackle complex, multi-step research tasks.","tools":["function_calling"],"knowledge_cutoff":"2024-06","license":"proprietary","open_weight":false},{"id":"openai/o3-mini-high","name":"OpenAI: o3 Mini High","created_by":"openai","source":"official","last_updated":"2026-03-24","family":"o3","description":"OpenAI o3-mini-high is the same model as [o3-mini](/openai/o3-mini) with reasoning_effort set to 
high.","context_window":200000,"max_output_tokens":100000,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":1.1,"output":4.4,"cached_input":0.55},"model_type":"reasoning","release_date":"2025-02-12","tagline":"OpenAI o3-mini-high is the same model as [o3-mini](/openai/o3-mini) with reasoning_effort set to high.","tools":["function_calling"]},{"id":"openai/o3-mini","name":"OpenAI: o3 Mini","created_by":"openai","source":"official","last_updated":"2026-03-24","family":"o3","description":"OpenAI o3-mini is a cost-efficient language model optimized for STEM reasoning tasks, particularly excelling in science, mathematics, and coding.","context_window":200000,"max_output_tokens":100000,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"vision":false,"fine_tuning":false,"batch":true},"pricing":{"input":1.1,"output":4.4,"cached_input":0.55},"model_type":"reasoning","release_date":"2025-01-31","tagline":"OpenAI o3-mini is a cost-efficient language model optimized for STEM reasoning tasks, particularly excelling in science, mathematics, and coding.","tools":["function_calling"],"knowledge_cutoff":"2023-10","license":"proprietary","open_weight":false},{"id":"openai/o3-pro","name":"OpenAI: o3 Pro","created_by":"openai","source":"official","last_updated":"2026-03-24","family":"o3","description":"The o-series of models are trained with reinforcement learning to think before they answer and perform complex 
reasoning.","context_window":200000,"max_output_tokens":100000,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"vision":true,"streaming":false,"fine_tuning":false,"batch":true},"pricing":{"input":20,"output":80},"model_type":"reasoning","release_date":"2025-06-10","tagline":"The o-series of models are trained with reinforcement learning to think before they answer and perform complex reasoning.","tools":["function_calling"],"knowledge_cutoff":"2024-06","license":"proprietary","open_weight":false},{"id":"openai/o3","name":"OpenAI: o3","created_by":"openai","source":"official","last_updated":"2026-03-24","family":"o3","description":"o3 is a well-rounded and powerful model across domains.","context_window":200000,"max_output_tokens":100000,"modalities":{"input":["image","text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"vision":true,"fine_tuning":false,"batch":true},"pricing":{"input":2,"output":8,"cached_input":0.5},"model_type":"reasoning","release_date":"2025-04-16","tagline":"o3 is a well-rounded and powerful model across domains.","tools":["function_calling"],"knowledge_cutoff":"2024-06","license":"proprietary","open_weight":false},{"id":"openai/o4-mini-deep-research","name":"OpenAI: o4 Mini Deep Research","created_by":"openai","source":"official","last_updated":"2026-03-24","family":"o4","description":"o4-mini-deep-research is OpenAI's faster, more affordable deep research model—ideal for tackling complex, multi-step research 
tasks.","context_window":200000,"max_output_tokens":100000,"modalities":{"input":["image","text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"vision":true,"fine_tuning":false,"batch":true},"pricing":{"input":2,"output":8,"cached_input":0.5},"model_type":"chat","release_date":"2025-10-10","tagline":"o4-mini-deep-research is OpenAI's faster, more affordable deep research model—ideal for tackling complex, multi-step research tasks.","tools":["function_calling"],"knowledge_cutoff":"2024-06","license":"proprietary","open_weight":false},{"id":"openai/o4-mini-high","name":"OpenAI: o4 Mini High","created_by":"openai","source":"official","last_updated":"2026-03-24","family":"o4","description":"OpenAI o4-mini-high is the same model as [o4-mini](/openai/o4-mini) with reasoning_effort set to high.","context_window":200000,"max_output_tokens":100000,"modalities":{"input":["image","text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":1.1,"output":4.4,"cached_input":0.275},"model_type":"reasoning","release_date":"2025-04-16","tagline":"OpenAI o4-mini-high is the same model as [o4-mini](/openai/o4-mini) with reasoning_effort set to high.","tools":["function_calling"]},{"id":"openai/o4-mini","name":"OpenAI: o4 Mini","created_by":"openai","source":"official","last_updated":"2026-03-24","family":"o4","description":"OpenAI o4-mini is a compact reasoning model in the o-series, optimized for fast, cost-efficient performance while retaining strong multimodal and agentic 
capabilities.","context_window":200000,"max_output_tokens":100000,"modalities":{"input":["image","text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"vision":true,"fine_tuning":true,"batch":true},"pricing":{"input":1.1,"output":4.4,"cached_input":0.275},"model_type":"reasoning","release_date":"2025-04-16","tagline":"OpenAI o4-mini is a compact reasoning model in the o-series, optimized for fast, cost-efficient performance while retaining strong multimodal and agentic capabilities.","tools":["function_calling"],"knowledge_cutoff":"2024-06","license":"proprietary","open_weight":false},{"id":"openrouter/auto","name":"Auto Router","created_by":"openrouter","source":"official","last_updated":"2026-05-10","description":"Your prompt will be processed by a meta-model and routed to one of dozens of models (see below), optimizing for the best possible output.","context_window":2000000,"modalities":{"input":["text","image","audio","video"],"output":["text","image"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"release_date":"2023-11-08","tagline":"Your prompt will be processed by a meta-model and routed to one of dozens of models (see below), optimizing for the best possible output.","tools":["function_calling"]},{"id":"openrouter/bodybuilder","name":"Body Builder (beta)","created_by":"openrouter","source":"official","last_updated":"2026-03-23","description":"Transform your natural language requests into structured OpenRouter API request objects.","context_window":128000,"modalities":{"input":["text"],"output":["text"]},"release_date":"2025-12-05","tagline":"Transform your natural language requests into structured OpenRouter API request objects."},{"id":"openrouter/elephant-alpha","name":"Elephant","created_by":"openrouter","source":"official","description":"Elephant Alpha is a 100B-parameter text model focused on intelligence efficiency, 
delivering strong performance while minimizing token usage.","release_date":"2026-04-13","context_window":262144,"max_output_tokens":32768,"tagline":"Elephant Alpha is a 100B-parameter text model focused on intelligence efficiency, delivering strong reasoning performance while minimizing token usage.","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true},"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-04-16"},{"id":"openrouter/free","name":"Free Models Router","created_by":"openrouter","source":"official","last_updated":"2026-03-24","description":"The simplest way to get free inference.","context_window":200000,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"release_date":"2026-02-01","tagline":"The simplest way to get free inference.","tools":["function_calling"]},{"id":"openrouter/fusion","name":"OpenRouter: Fusion","created_by":"openrouter","source":"official","description":"Fusion turns your prompt into a small multi-model deliberation.","release_date":"2026-06-13","context_window":1000000,"tagline":"Fusion turns your prompt into a small multi-model deliberation.","modalities":{"input":["text"],"output":["text"]},"last_updated":"2026-06-18"},{"id":"openrouter/owl-alpha","name":"Owl Alpha","created_by":"openrouter","source":"official","description":"Owl Alpha is a high-performance foundation model designed for agentic workloads.","release_date":"2026-04-28","context_window":1048756,"max_output_tokens":262144,"tagline":"Owl Alpha is a high-performance foundation model designed for agentic workloads.","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true},"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-05-01"},{"id":"openrouter/pareto-code","name":"Pareto Code 
Router","created_by":"openrouter","source":"official","description":"The Pareto Router maintains a tiered shortlist of strong coding models, ranked by [Artificial Analysis](https://artificialanalysis.ai/) coding percentiles.","release_date":"2026-04-21","context_window":2000000,"tagline":"The Pareto Router is a way to have OpenRouter always pick a strong coding model for your needs without committing to a specific one.","modalities":{"input":["text"],"output":["text"]},"last_updated":"2026-05-10"},{"id":"perceptron/perceptron-mk1","name":"Perceptron: Perceptron Mk1","created_by":"perceptron","source":"official","description":"Perceptron Mk1 (Mark One) is Perceptron's highest-quality vision-language model for video and embodied reasoning.** It accepts image and video inputs paired with natural language queries, and produces","release_date":"2026-05-12","context_window":32768,"max_output_tokens":8192,"tagline":"Perceptron Mk1 (Mark One) is Perceptron's highest-quality vision-language model for video and embodied reasoning.** It accepts image and video inputs paired with natural language queries, and produces","capabilities":{"structured_output":true,"reasoning":true,"json_mode":true},"modalities":{"input":["text","image","video"],"output":["text"]},"pricing":{"input":0.15,"output":1.5},"last_updated":"2026-05-14"},{"id":"perplexity/sonar-deep-research","name":"Perplexity: Sonar Deep Research","created_by":"perplexity","source":"official","last_updated":"2026-03-23","description":"Sonar Deep Research is a research-focused model designed for multi-step retrieval, synthesis, and reasoning across complex topics.","context_window":128000,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"reasoning":true},"pricing":{"input":2,"output":8},"family":"sonar","model_type":"chat","release_date":"2025-03-07","tagline":"Sonar Deep Research is a research-focused model designed for multi-step retrieval, synthesis, and reasoning across complex 
topics."},{"id":"perplexity/sonar-pro-search","name":"Perplexity: Sonar Pro Search","created_by":"perplexity","source":"official","last_updated":"2026-03-24","description":"Exclusively available on the OpenRouter API, Sonar Pro's new Pro Search mode is Perplexity's most advanced agentic search system.","context_window":200000,"max_output_tokens":8000,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":3,"output":15},"family":"sonar","model_type":"chat","release_date":"2025-10-30","tagline":"Exclusively available on the OpenRouter API, Sonar Pro's new Pro Search mode is Perplexity's most advanced agentic search system."},{"id":"perplexity/sonar-pro","name":"Perplexity: Sonar Pro","created_by":"perplexity","source":"official","last_updated":"2026-03-23","description":"Note: Sonar Pro pricing includes Perplexity search pricing.","context_window":200000,"max_output_tokens":8000,"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":3,"output":15},"family":"sonar","model_type":"chat","release_date":"2025-03-07","tagline":"Note: Sonar Pro pricing includes Perplexity search pricing."},{"id":"perplexity/sonar-reasoning-pro","name":"Perplexity: Sonar Reasoning Pro","created_by":"perplexity","source":"official","last_updated":"2026-03-23","description":"Note: Sonar Pro pricing includes Perplexity search pricing.","context_window":128000,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"reasoning":true},"pricing":{"input":2,"output":8},"model_type":"reasoning","family":"sonar","release_date":"2025-03-07","tagline":"Note: Sonar Pro pricing includes Perplexity search pricing."},{"id":"perplexity/sonar","name":"Perplexity: Sonar","created_by":"perplexity","source":"official","last_updated":"2026-03-23","description":"Sonar is lightweight, affordable, fast, and simple to use — now featuring citations and the ability to customize 
sources.","context_window":127072,"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":1,"output":1},"family":"sonar","model_type":"chat","release_date":"2025-01-27","tagline":"Sonar is lightweight, affordable, fast, and simple to use — now featuring citations and the ability to customize sources."},{"id":"poolside/laguna-m.1:free","name":"Poolside: Laguna M.1 (free)","created_by":"poolside","source":"official","description":"Laguna M.1 is the flagship coding agent model from [Poolside](https://poolside.ai/), optimized for complex software engineering tasks.","release_date":"2026-04-28","context_window":262144,"max_output_tokens":32768,"tagline":"Laguna M.1 is the flagship coding agent model from [Poolside](https://poolside.ai), optimized for complex software engineering tasks.","capabilities":{"tool_call":true,"reasoning":true,"structured_output":true,"json_mode":true},"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-06-20"},{"id":"poolside/laguna-m.1","name":"Poolside: Laguna M.1","created_by":"poolside","source":"official","description":"Laguna M.1 is the flagship coding agent model from [Poolside](https://poolside.ai/), optimized for complex software engineering tasks.","release_date":"2026-04-28","context_window":262144,"max_output_tokens":32768,"tagline":"Laguna M.1 is the flagship coding agent model from [Poolside](https://poolside.ai/), optimized for complex software engineering tasks.","capabilities":{"tool_call":true,"reasoning":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.2,"output":0.4,"cached_input":0.1},"tools":["function_calling"],"last_updated":"2026-06-20"},{"id":"poolside/laguna-xs.2:free","name":"Poolside: Laguna XS.2 (free)","created_by":"poolside","source":"official","description":"Laguna XS.2 is the second-generation model in the XS size class from [Poolside](https://poolside.ai/), their efficient coding agent 
series.","release_date":"2026-04-28","context_window":262144,"max_output_tokens":32768,"tagline":"Laguna XS.2 is the second-generation model in the XS size class from [Poolside](https://poolside.ai), their efficient coding agent series.","capabilities":{"tool_call":true,"reasoning":true,"structured_output":true,"json_mode":true},"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-06-30","status":"deprecated","deprecation_date":"9999-01-01"},{"id":"poolside/laguna-xs.2","name":"Poolside: Laguna XS.2","created_by":"poolside","source":"official","description":"Laguna XS.2 is the second-generation model in the XS size class from [Poolside](https://poolside.ai/), their efficient coding agent series.","release_date":"2026-04-28","context_window":262144,"max_output_tokens":32768,"tagline":"Laguna XS.2 is the second-generation model in the XS size class from [Poolside](https://poolside.ai/), their efficient coding agent series.","capabilities":{"tool_call":true,"reasoning":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.1,"output":0.2,"cached_input":0.05},"tools":["function_calling"],"last_updated":"2026-06-20"},{"id":"prime-intellect/intellect-3","name":"Prime Intellect: INTELLECT-3","created_by":"prime-intellect","source":"official","last_updated":"2026-03-24","description":"INTELLECT-3 is a 106B-parameter Mixture-of-Experts model (12B active) post-trained from GLM-4.5-Air-Base using supervised fine-tuning (SFT) followed by large-scale reinforcement learning (RL).","context_window":131072,"max_output_tokens":131072,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":0.2,"output":1.1},"release_date":"2025-11-27","tagline":"INTELLECT-3 is a 106B-parameter Mixture-of-Experts model (12B active) post-trained from GLM-4.5-Air-Base using supervised fine-tuning (SFT) followed by large-scale 
reinforcement learning (RL).","tools":["function_calling"]},{"id":"qwen/qwen-2.5-72b-instruct","name":"Qwen2.5 72B Instruct","created_by":"qwen","source":"official","last_updated":"2026-05-17","family":"qwen","description":"Qwen2.5 72B is the latest series of Qwen large language models.","context_window":131072,"max_output_tokens":16384,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"fine_tuning":true,"reasoning":true,"batch":true},"pricing":{"input":0.36,"output":0.4},"model_type":"chat","parameters":72,"release_date":"2024-09-19","tagline":"Qwen2.5 72B is the latest series of Qwen large language models.","tools":["function_calling"],"license":"apache-2.0","open_weight":true},{"id":"qwen/qwen-2.5-7b-instruct","name":"Qwen: Qwen2.5 7B Instruct","created_by":"qwen","source":"official","last_updated":"2026-05-17","family":"qwen","description":"Qwen2.5 7B is the latest series of Qwen large language models.","context_window":131072,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"fine_tuning":true,"reasoning":true,"batch":true},"pricing":{"input":0.04,"output":0.1},"model_type":"chat","parameters":7,"release_date":"2024-10-16","tagline":"Qwen2.5 7B is the latest series of Qwen large language models.","tools":["function_calling"],"max_output_tokens":32768,"license":"apache-2.0","open_weight":true},{"id":"qwen/qwen-2.5-coder-32b-instruct","name":"Qwen2.5 Coder 32B Instruct","created_by":"qwen","source":"official","last_updated":"2026-05-23","family":"qwen","description":"Qwen2.5-Coder is the latest series of Code-Specific Qwen large language models (formerly known as CodeQwen).","context_window":128000,"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.66,"output":1},"model_type":"code","parameters":32,"release_date":"2024-11-11","tagline":"Qwen2.5-Coder is the 
latest series of Code-Specific Qwen large language models (formerly known as CodeQwen).","max_output_tokens":32768},{"id":"qwen/qwen-2.5-vl-7b-instruct","name":"Qwen: Qwen2.5-VL 7B Instruct","created_by":"qwen","source":"official","last_updated":"2026-03-23","family":"qwen","description":"Qwen2.5 VL 7B is a multimodal LLM from the Qwen Team with the following key enhancements:\n\n- SoTA understanding of images of various resolution & ratio: Qwen2.5-VL achieves state-of-the-art performanc","context_window":32768,"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":0.2,"output":0.2},"model_type":"chat","parameters":7,"release_date":"2024-08-28","tagline":"Qwen2.5 VL 7B is a multimodal LLM from the Qwen Team with the following key enhancements:\n\n- SoTA understanding of images of various resolution & ratio: Qwen2.5-VL achieves state-of-the-art performanc","license":"apache-2.0","open_weight":true,"capabilities":{"streaming":true,"reasoning":true,"tool_call":true,"structured_output":true,"batch":true,"vision":true,"fine_tuning":true,"json_mode":true}},{"id":"qwen/qwen-max","name":"Qwen: Qwen-Max ","created_by":"qwen","source":"official","last_updated":"2026-03-24","family":"qwen","description":"Qwen-Max, based on Qwen2.5, provides the best inference performance among [Qwen models](/qwen), especially for complex multi-step tasks.","context_window":32768,"max_output_tokens":8192,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"reasoning":true,"batch":true},"pricing":{"input":1.04,"output":4.16,"cached_input":0.208},"model_type":"chat","release_date":"2025-02-01","tagline":"Qwen-Max, based on Qwen2.5, provides the best inference performance among [Qwen models](/qwen), especially for complex multi-step tasks.","tools":["function_calling"],"license":"proprietary","open_weight":false},{"id":"qwen/qwen-plus-2025-07-28:thinking","name":"Qwen: Qwen Plus 0728 
(thinking)","created_by":"qwen","source":"official","last_updated":"2026-03-24","family":"qwen","description":"Qwen Plus 0728, based on the Qwen3 foundation model, is a 1 million context hybrid reasoning model with a balanced performance, speed, and cost combination.","context_window":1000000,"max_output_tokens":32768,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":0.26,"output":0.78},"model_type":"chat","release_date":"2025-09-08","tagline":"Qwen Plus 0728, based on the Qwen3 foundation model, is a 1 million context hybrid reasoning model with a balanced performance, speed, and cost combination.","tools":["function_calling"]},{"id":"qwen/qwen-plus-2025-07-28","name":"Qwen: Qwen Plus 0728","created_by":"qwen","source":"official","last_updated":"2026-03-24","family":"qwen","description":"Qwen Plus 0728, based on the Qwen3 foundation model, is a 1 million context hybrid reasoning model with a balanced performance, speed, and cost combination.","context_window":1000000,"max_output_tokens":32768,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true},"pricing":{"input":0.26,"output":0.78,"cached_input":0.052},"model_type":"chat","release_date":"2025-09-08","alias":"qwen/qwen-plus","tagline":"Qwen Plus 0728, based on the Qwen3 foundation model, is a 1 million context hybrid reasoning model with a balanced performance, speed, and cost combination.","tools":["function_calling"]},{"id":"qwen/qwen-plus","name":"Qwen: Qwen-Plus","created_by":"qwen","source":"official","last_updated":"2026-03-26","family":"qwen","description":"Qwen-Plus, based on the Qwen2.5 foundation model, is a 131K context model with a balanced performance, speed, and cost 
combination.","context_window":1000000,"max_output_tokens":32768,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"reasoning":true,"batch":true},"pricing":{"input":0.26,"output":0.78,"cached_input":0.052},"model_type":"chat","release_date":"2025-02-01","tagline":"Qwen Plus 0728, based on the Qwen3 foundation model, is a 1 million context hybrid reasoning model with a balanced performance, speed, and cost combination.","tools":["function_calling"],"snapshots":["qwen/qwen-plus-2025-07-28"],"license":"proprietary","open_weight":false},{"id":"qwen/qwen-turbo","name":"Qwen: Qwen-Turbo","created_by":"qwen","source":"official","last_updated":"2026-03-24","family":"qwen","description":"Qwen-Turbo, based on Qwen2.5, is a 1M context model that provides fast speed and low cost, suitable for simple tasks.","context_window":131072,"max_output_tokens":8192,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"reasoning":true,"batch":true},"pricing":{"input":0.033,"output":0.13,"cached_input":0.007},"model_type":"chat","release_date":"2025-02-01","tagline":"Qwen-Turbo, based on Qwen2.5, is a 1M context model that provides fast speed and low cost, suitable for simple tasks.","tools":["function_calling"],"license":"proprietary","open_weight":false},{"id":"qwen/qwen-vl-max","name":"Qwen: Qwen VL Max","created_by":"qwen","source":"official","last_updated":"2026-03-24","family":"qwen","description":"Qwen VL Max is a visual understanding model with 7500 tokens context length.","context_window":131072,"max_output_tokens":32768,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true},"pricing":{"input":0.52,"output":2.08},"model_type":"chat","release_date":"2025-02-01","tagline":"Qwen VL Max is a visual understanding model with 7500 
tokens context length.","tools":["function_calling"]},{"id":"qwen/qwen-vl-plus","name":"Qwen: Qwen VL Plus","created_by":"qwen","source":"official","last_updated":"2026-03-24","family":"qwen","description":"Qwen's Enhanced Large Visual Language Model.","context_window":131072,"max_output_tokens":8192,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"structured_output":true,"json_mode":true},"pricing":{"input":0.137,"output":0.41,"cached_input":0.027},"model_type":"chat","release_date":"2025-02-05","tagline":"Qwen's Enhanced Large Visual Language Model."},{"id":"qwen/qwen2.5-coder-7b-instruct","name":"Qwen: Qwen2.5 Coder 7B Instruct","created_by":"qwen","source":"official","last_updated":"2026-03-24","family":"qwen2.5","description":"Qwen2.5-Coder-7B-Instruct is a 7B parameter instruction-tuned language model optimized for code-related tasks such as code generation, reasoning, and bug fixing.","context_window":32768,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"structured_output":true,"json_mode":true},"pricing":{"input":0.03,"output":0.09},"model_type":"code","parameters":7,"release_date":"2025-04-15","tagline":"Qwen2.5-Coder-7B-Instruct is a 7B parameter instruction-tuned language model optimized for code-related tasks such as code generation, reasoning, and bug fixing."},{"id":"qwen/qwen2.5-vl-32b-instruct","name":"Qwen: Qwen2.5 VL 32B Instruct","created_by":"qwen","source":"official","last_updated":"2026-03-24","family":"qwen2.5","description":"Qwen2.5-VL-32B is a multimodal vision-language model fine-tuned through reinforcement learning for enhanced mathematical reasoning, structured outputs, and visual problem-solving 
capabilities.","context_window":128000,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"structured_output":true,"json_mode":true,"streaming":true,"reasoning":true,"tool_call":true,"batch":true,"vision":true,"fine_tuning":true},"pricing":{"input":0.2,"output":0.6},"model_type":"chat","parameters":32,"release_date":"2025-03-24","tagline":"Qwen2.5-VL-32B is a multimodal vision-language model fine-tuned through reinforcement learning for enhanced mathematical reasoning, structured outputs, and visual problem-solving capabilities.","license":"apache-2.0","open_weight":true},{"id":"qwen/qwen2.5-vl-72b-instruct","name":"Qwen: Qwen2.5 VL 72B Instruct","created_by":"qwen","source":"official","last_updated":"2026-06-18","family":"qwen2.5","description":"Qwen2.5-VL is proficient in recognizing common objects such as flowers, birds, fish, and insects.","context_window":131072,"max_output_tokens":128000,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"structured_output":true,"json_mode":true,"streaming":true,"reasoning":true,"tool_call":true,"batch":true,"vision":true,"fine_tuning":true},"pricing":{"input":0.8,"output":1,"cached_input":0.4},"model_type":"chat","parameters":72,"release_date":"2025-02-01","tagline":"Qwen2.5-VL is proficient in recognizing common objects such as flowers, birds, fish, and insects.","license":"apache-2.0","open_weight":true},{"id":"qwen/qwen3-14b","name":"Qwen: Qwen3 14B","created_by":"qwen","source":"official","last_updated":"2026-05-17","family":"qwen3","description":"Qwen3-14B is a dense 14.8B parameter causal language model from the Qwen3 series, designed for both complex reasoning and efficient 
dialogue.","context_window":131702,"max_output_tokens":40960,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"batch":true,"fine_tuning":true},"pricing":{"input":0.1,"output":0.24},"model_type":"chat","parameters":14,"release_date":"2025-04-28","tagline":"Qwen3-14B is a dense 14.8B parameter causal language model from the Qwen3 series, designed for both complex reasoning and efficient dialogue.","tools":["function_calling"],"license":"apache-2.0","open_weight":true},{"id":"qwen/qwen3-235b-a22b-2507","name":"Qwen: Qwen3 235B A22B Instruct 2507","created_by":"qwen","source":"official","last_updated":"2026-06-10","family":"qwen3","description":"Qwen3-235B-A22B-Instruct-2507 is a multilingual, instruction-tuned mixture-of-experts language model based on the Qwen3-235B architecture, with 22B active parameters per forward pass.","context_window":262144,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":0.09,"output":0.1},"model_type":"chat","parameters":235,"active_parameters":22,"release_date":"2025-07-21","max_output_tokens":16384,"alias":"qwen/qwen3-235b-a22b","tagline":"Qwen3-235B-A22B-Instruct-2507 is a multilingual, instruction-tuned mixture-of-experts language model based on the Qwen3-235B architecture, with 22B active parameters per forward pass.","tools":["function_calling"]},{"id":"qwen/qwen3-235b-a22b-thinking-2507","name":"Qwen: Qwen3 235B A22B Thinking 2507","created_by":"qwen","source":"official","last_updated":"2026-06-02","family":"qwen3","description":"Qwen3-235B-A22B-Thinking-2507 is a high-performance, open-weight Mixture-of-Experts (MoE) language model optimized for complex reasoning 
tasks.","context_window":262144,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"batch":true,"fine_tuning":true},"pricing":{"input":0.1,"output":0.1,"cached_input":0.1},"model_type":"chat","parameters":235,"active_parameters":22,"release_date":"2025-07-25","alias":"qwen/qwen3-235b-a22b-thinking","tagline":"Qwen3-235B-A22B-Thinking-2507 is a high-performance, open-weight Mixture-of-Experts (MoE) language model optimized for complex reasoning tasks.","tools":["function_calling"],"max_output_tokens":262144,"status":"deprecated","deprecation_date":"2026-04-22","license":"apache-2.0","open_weight":true},{"id":"qwen/qwen3-235b-a22b-thinking","name":"Qwen: Qwen3 235B A22B Thinking 2507","created_by":"qwen","source":"official","last_updated":"2026-06-02","family":"qwen3","description":"Qwen3-235B-A22B-Thinking-2507 is a high-performance, open-weight Mixture-of-Experts (MoE) language model optimized for complex reasoning tasks.","release_date":"2025-07-25","context_window":262144,"parameters":235,"active_parameters":22,"model_type":"chat","tagline":"Qwen3-235B-A22B-Thinking-2507 is a high-performance, open-weight Mixture-of-Experts (MoE) language model optimized for complex reasoning tasks.","capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"batch":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.1,"output":0.1,"cached_input":0.1},"tools":["function_calling"],"snapshots":["qwen/qwen3-235b-a22b-thinking-2507"],"max_output_tokens":262144,"status":"deprecated","deprecation_date":"2026-04-22","license":"apache-2.0","open_weight":true},{"id":"qwen/qwen3-235b-a22b","name":"Qwen: Qwen3 235B A22B","created_by":"qwen","source":"official","last_updated":"2026-03-26","family":"qwen3","description":"Qwen3-235B-A22B is a 235B parameter mixture-of-experts (MoE) model 
developed by Qwen, activating 22B parameters per forward pass.","context_window":131072,"max_output_tokens":8192,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"batch":true,"fine_tuning":true},"pricing":{"input":0.455,"output":1.82},"model_type":"chat","parameters":235,"active_parameters":22,"release_date":"2025-04-28","tagline":"Qwen3-235B-A22B-Instruct-2507 is a multilingual, instruction-tuned mixture-of-experts language model based on the Qwen3-235B architecture, with 22B active parameters per forward pass.","tools":["function_calling"],"snapshots":["qwen/qwen3-235b-a22b-2507"],"license":"apache-2.0","open_weight":true},{"id":"qwen/qwen3-30b-a3b-instruct-2507","name":"Qwen: Qwen3 30B A3B Instruct 2507","created_by":"qwen","source":"official","last_updated":"2026-06-10","family":"qwen3","description":"Qwen3-30B-A3B-Instruct-2507 is a 30.5B-parameter mixture-of-experts language model from Qwen, with 3.3B active parameters per inference.","context_window":131072,"max_output_tokens":32000,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"reasoning":true,"batch":true,"fine_tuning":true},"pricing":{"input":0.048,"output":0.193},"model_type":"chat","parameters":30,"active_parameters":3,"release_date":"2025-07-29","alias":"qwen/qwen3-30b-a3b-instruct","tagline":"Qwen3-30B-A3B-Instruct-2507 is a 30.5B-parameter mixture-of-experts language model from Qwen, with 3.3B active parameters per inference.","tools":["function_calling"],"license":"apache-2.0","open_weight":true},{"id":"qwen/qwen3-30b-a3b-instruct","name":"Qwen: Qwen3 30B A3B Instruct 2507","created_by":"qwen","source":"official","last_updated":"2026-06-10","family":"qwen3","description":"Qwen3-30B-A3B-Instruct-2507 is a 30.5B-parameter mixture-of-experts language model from Qwen, with 3.3B active parameters per 
inference.","release_date":"2025-07-29","context_window":131072,"max_output_tokens":32000,"parameters":30,"active_parameters":3,"model_type":"chat","tagline":"Qwen3-30B-A3B-Instruct-2507 is a 30.5B-parameter mixture-of-experts language model from Qwen, with 3.3B active parameters per inference.","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"reasoning":true,"batch":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.048,"output":0.193},"tools":["function_calling"],"snapshots":["qwen/qwen3-30b-a3b-instruct-2507"],"license":"apache-2.0","open_weight":true},{"id":"qwen/qwen3-30b-a3b-thinking-2507","name":"Qwen: Qwen3 30B A3B Thinking 2507","created_by":"qwen","source":"official","last_updated":"2026-03-24","family":"qwen3","description":"Qwen3-30B-A3B-Thinking-2507 is a 30B parameter Mixture-of-Experts reasoning model optimized for complex tasks requiring extended multi-step thinking.","context_window":131072,"max_output_tokens":131072,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"batch":true,"fine_tuning":true},"pricing":{"input":0.08,"output":0.4,"cached_input":0.08},"model_type":"chat","parameters":30,"active_parameters":3,"release_date":"2025-08-28","alias":"qwen/qwen3-30b-a3b-thinking","tagline":"Qwen3-30B-A3B-Thinking-2507 is a 30B parameter Mixture-of-Experts reasoning model optimized for complex tasks requiring extended multi-step thinking.","tools":["function_calling"],"license":"apache-2.0","open_weight":true},{"id":"qwen/qwen3-30b-a3b-thinking","name":"Qwen: Qwen3 30B A3B Thinking 2507","created_by":"qwen","source":"official","last_updated":"2026-03-24","family":"qwen3","description":"Qwen3-30B-A3B-Thinking-2507 is a 30B parameter Mixture-of-Experts reasoning model optimized for complex tasks requiring extended multi-step 
thinking.","release_date":"2025-08-28","context_window":131072,"max_output_tokens":131072,"parameters":30,"active_parameters":3,"model_type":"chat","tagline":"Qwen3-30B-A3B-Thinking-2507 is a 30B parameter Mixture-of-Experts reasoning model optimized for complex tasks requiring extended multi-step thinking.","capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"batch":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.08,"output":0.4,"cached_input":0.08},"tools":["function_calling"],"snapshots":["qwen/qwen3-30b-a3b-thinking-2507"],"license":"apache-2.0","open_weight":true},{"id":"qwen/qwen3-30b-a3b","name":"Qwen: Qwen3 30B A3B","created_by":"qwen","source":"official","last_updated":"2026-06-10","family":"qwen3","description":"Qwen3, the latest generation in the Qwen large language model series, features both dense and mixture-of-experts (MoE) architectures to excel in reasoning, multilingual support, and advanced agent tasks.","context_window":131072,"max_output_tokens":16384,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"batch":true,"fine_tuning":true},"pricing":{"input":0.12,"output":0.5},"model_type":"chat","parameters":30,"active_parameters":3,"release_date":"2025-04-28","tagline":"Qwen3, the latest generation in the Qwen large language model series, features both dense and mixture-of-experts (MoE) architectures to excel in reasoning, multilingual support, and advanced agent tas","tools":["function_calling"],"status":"deprecated","deprecation_date":"2026-06-05","license":"apache-2.0","open_weight":true},{"id":"qwen/qwen3-32b","name":"Qwen: Qwen3 32B","created_by":"qwen","source":"official","last_updated":"2026-05-17","family":"qwen3","description":"Qwen3-32B is a dense 32.8B parameter causal language model from the Qwen3 series, optimized for both 
complex reasoning and efficient dialogue.","context_window":131072,"max_output_tokens":16384,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"batch":true,"fine_tuning":true},"pricing":{"input":0.08,"output":0.28,"cached_input":0.04},"model_type":"chat","parameters":32,"release_date":"2025-04-28","tagline":"Qwen3-32B is a dense 32.8B parameter causal language model from the Qwen3 series, optimized for both complex reasoning and efficient dialogue.","tools":["function_calling"],"license":"apache-2.0","open_weight":true},{"id":"qwen/qwen3-4b:free","name":"Qwen: Qwen3 4B (free)","created_by":"qwen","source":"official","last_updated":"2026-03-24","family":"qwen3","description":"Qwen3-4B is a 4 billion parameter dense language model from the Qwen3 series, designed to support both general-purpose and reasoning-intensive tasks.","status":"deprecated","deprecation_date":"2026-03-29","context_window":40960,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"model_type":"chat","release_date":"2025-04-30","tagline":"Qwen3-4B is a 4 billion parameter dense language model from the Qwen3 series, designed to support both general-purpose and reasoning-intensive tasks.","tools":["function_calling"]},{"id":"qwen/qwen3-8b","name":"Qwen: Qwen3 8B","created_by":"qwen","source":"official","last_updated":"2026-05-17","family":"qwen3","description":"Qwen3-8B is a dense 8.2B parameter causal language model from the Qwen3 series, designed for both reasoning-heavy tasks and efficient 
dialogue.","context_window":131072,"max_output_tokens":8192,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"batch":true,"fine_tuning":true},"pricing":{"input":0.05,"output":0.4,"cached_input":0.05},"model_type":"chat","parameters":8,"release_date":"2025-04-28","tagline":"Qwen3-8B is a dense 8.2B parameter causal language model from the Qwen3 series, designed for both reasoning-heavy tasks and efficient dialogue.","tools":["function_calling"],"license":"apache-2.0","open_weight":true},{"id":"qwen/qwen3-coder-30b-a3b-instruct","name":"Qwen: Qwen3 Coder 30B A3B Instruct","created_by":"qwen","source":"official","last_updated":"2026-03-24","family":"qwen3","description":"Qwen3-Coder-30B-A3B-Instruct is a 30.5B parameter Mixture-of-Experts (MoE) model with 128 experts (8 active per forward pass), designed for advanced code generation, repository-scale understanding, and agentic tool use.","context_window":160000,"max_output_tokens":32768,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"reasoning":true,"batch":true,"fine_tuning":true},"pricing":{"input":0.07,"output":0.27},"model_type":"code","parameters":30,"active_parameters":3,"release_date":"2025-07-31","tagline":"Qwen3-Coder-30B-A3B-Instruct is a 30.5B parameter Mixture-of-Experts (MoE) model with 128 experts (8 active per forward pass), designed for advanced code generation, repository-scale understanding, an","tools":["function_calling"],"license":"apache-2.0","open_weight":true},{"id":"qwen/qwen3-coder-flash","name":"Qwen: Qwen3 Coder Flash","created_by":"qwen","source":"official","last_updated":"2026-03-24","family":"qwen3","description":"Qwen3 Coder Flash is Alibaba's fast and cost efficient version of their proprietary Qwen3 Coder 
Plus.","context_window":1000000,"max_output_tokens":65536,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"reasoning":true,"batch":true,"fine_tuning":true},"pricing":{"input":0.195,"output":0.975,"cached_input":0.039},"model_type":"code","release_date":"2025-09-17","tagline":"Qwen3 Coder Flash is Alibaba's fast and cost efficient version of their proprietary Qwen3 Coder Plus.","tools":["function_calling"],"license":"apache-2.0","open_weight":true},{"id":"qwen/qwen3-coder:free","name":"Qwen: Qwen3 Coder 480B A35B (free)","created_by":"qwen","source":"official","last_updated":"2026-05-17","family":"qwen3","description":"Qwen3-Coder-480B-A35B-Instruct is a Mixture-of-Experts (MoE) code generation model developed by the Qwen team.","context_window":1048576,"max_output_tokens":262000,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true},"model_type":"code","parameters":480,"active_parameters":35,"release_date":"2025-07-23","tagline":"Qwen3-Coder-480B-A35B-Instruct is a Mixture-of-Experts (MoE) code generation model developed by the Qwen team.","tools":["function_calling"]},{"id":"qwen/qwen3-coder-next","name":"Qwen: Qwen3 Coder Next","created_by":"qwen","source":"official","last_updated":"2026-05-07","family":"qwen3","description":"Qwen3-Coder-Next is an open-weight causal language model optimized for coding agents and local development workflows.","context_window":262144,"max_output_tokens":262144,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"fine_tuning":true,"reasoning":true,"batch":true},"pricing":{"input":0.11,"output":0.8,"cached_input":0.07},"model_type":"code","release_date":"2026-02-04","tagline":"Qwen3-Coder-Next is an open-weight causal language model optimized for coding agents and local development 
workflows.","tools":["function_calling"],"license":"apache-2.0","open_weight":true},{"id":"qwen/qwen3-coder-plus","name":"Qwen: Qwen3 Coder Plus","created_by":"qwen","source":"official","last_updated":"2026-03-24","family":"qwen3","description":"Qwen3 Coder Plus is Alibaba's proprietary version of the Open Source Qwen3 Coder 480B A35B.","context_window":1000000,"max_output_tokens":65536,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"fine_tuning":true,"reasoning":true,"batch":true},"pricing":{"input":0.65,"output":3.25,"cached_input":0.13},"model_type":"code","release_date":"2025-09-23","tagline":"Qwen3 Coder Plus is Alibaba's proprietary version of the Open Source Qwen3 Coder 480B A35B.","tools":["function_calling"],"license":"apache-2.0","open_weight":true},{"id":"qwen/qwen3-coder","name":"Qwen: Qwen3 Coder 480B A35B","created_by":"qwen","source":"official","last_updated":"2026-05-17","family":"qwen3","description":"Qwen3-Coder-480B-A35B-Instruct is a Mixture-of-Experts (MoE) code generation model developed by the Qwen team.","context_window":1048576,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true},"pricing":{"input":0.22,"output":1.8,"cached_input":0.022},"model_type":"code","parameters":480,"active_parameters":35,"release_date":"2025-07-23","tagline":"Qwen3-Coder-480B-A35B-Instruct is a Mixture-of-Experts (MoE) code generation model developed by the Qwen team.","tools":["function_calling"],"max_output_tokens":65536},{"id":"qwen/qwen3-max-thinking","name":"Qwen: Qwen3 Max Thinking","created_by":"qwen","source":"official","last_updated":"2026-03-24","family":"qwen3","description":"Qwen3-Max-Thinking is the flagship reasoning model in the Qwen3 series, designed for high-stakes cognitive tasks that require deep, multi-step 
reasoning.","context_window":262144,"max_output_tokens":32768,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":0.78,"output":3.9},"model_type":"chat","release_date":"2026-02-09","tagline":"Qwen3-Max-Thinking is the flagship reasoning model in the Qwen3 series, designed for high-stakes cognitive tasks that require deep, multi-step reasoning.","tools":["function_calling"]},{"id":"qwen/qwen3-max","name":"Qwen: Qwen3 Max","created_by":"qwen","source":"official","last_updated":"2026-03-24","family":"qwen3","description":"Qwen3-Max is an updated release built on the Qwen3 series, offering major improvements in reasoning, instruction following, multilingual support, and long-tail knowledge coverage compared to the January 2025 version.","context_window":262144,"max_output_tokens":32768,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"reasoning":true,"fine_tuning":true,"batch":true},"pricing":{"input":0.78,"output":3.9,"cached_input":0.156},"model_type":"chat","release_date":"2025-09-23","tagline":"Qwen3-Max is an updated release built on the Qwen3 series, offering major improvements in reasoning, instruction following, multilingual support, and long-tail knowledge coverage compared to the Janua","tools":["function_calling"],"license":"apache-2.0","open_weight":true},{"id":"qwen/qwen3-next-80b-a3b-instruct:free","name":"Qwen: Qwen3 Next 80B A3B Instruct (free)","created_by":"qwen","source":"official","last_updated":"2026-03-24","family":"qwen3","description":"Qwen3-Next-80B-A3B-Instruct is an instruction-tuned chat model in the Qwen3-Next series optimized for fast, stable responses without “thinking” 
traces.","context_window":262144,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true},"model_type":"chat","parameters":80,"active_parameters":3,"release_date":"2025-09-11","tagline":"Qwen3-Next-80B-A3B-Instruct is an instruction-tuned chat model in the Qwen3-Next series optimized for fast, stable responses without “thinking” traces.","tools":["function_calling"]},{"id":"qwen/qwen3-next-80b-a3b-instruct","name":"Qwen: Qwen3 Next 80B A3B Instruct","created_by":"qwen","source":"official","last_updated":"2026-04-25","family":"qwen3","description":"Qwen3-Next-80B-A3B-Instruct is an instruction-tuned chat model in the Qwen3-Next series optimized for fast, stable responses without “thinking” traces.","context_window":262144,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"reasoning":true,"batch":true,"fine_tuning":true},"pricing":{"input":0.09,"output":1.1},"model_type":"chat","parameters":80,"active_parameters":3,"release_date":"2025-09-11","tagline":"Qwen3-Next-80B-A3B-Instruct is an instruction-tuned chat model in the Qwen3-Next series optimized for fast, stable responses without “thinking” traces.","tools":["function_calling"],"max_output_tokens":16384,"license":"apache-2.0","open_weight":true},{"id":"qwen/qwen3-next-80b-a3b-thinking","name":"Qwen: Qwen3 Next 80B A3B Thinking","created_by":"qwen","source":"official","last_updated":"2026-05-17","family":"qwen3","description":"Qwen3-Next-80B-A3B-Thinking is a reasoning-first chat model in the Qwen3-Next line that outputs structured “thinking” traces by 
default.","context_window":262144,"max_output_tokens":32768,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"batch":true,"fine_tuning":true},"pricing":{"input":0.098,"output":0.78},"model_type":"chat","parameters":80,"active_parameters":3,"release_date":"2025-09-11","tagline":"Qwen3-Next-80B-A3B-Thinking is a reasoning-first chat model in the Qwen3-Next line that outputs structured “thinking” traces by default.","tools":["function_calling"],"license":"apache-2.0","open_weight":true},{"id":"qwen/qwen3-vl-235b-a22b-instruct","name":"Qwen: Qwen3 VL 235B A22B Instruct","created_by":"qwen","source":"official","last_updated":"2026-04-25","family":"qwen3","description":"Qwen3-VL-235B-A22B Instruct is an open-weight multimodal model that unifies strong text generation with visual understanding across images and video.","context_window":262144,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"vision":true,"reasoning":true,"fine_tuning":true},"pricing":{"input":0.2,"output":0.88,"cached_input":0.11},"model_type":"chat","parameters":235,"active_parameters":22,"release_date":"2025-09-23","tagline":"Qwen3-VL-235B-A22B Instruct is an open-weight multimodal model that unifies strong text generation with visual understanding across images and video.","tools":["function_calling"],"max_output_tokens":16384,"license":"apache-2.0","open_weight":true},{"id":"qwen/qwen3-vl-235b-a22b-thinking","name":"Qwen: Qwen3 VL 235B A22B Thinking","created_by":"qwen","source":"official","last_updated":"2026-03-24","family":"qwen3","description":"Qwen3-VL-235B-A22B Thinking is a multimodal model that unifies strong text generation with visual understanding across images and 
video.","context_window":131072,"max_output_tokens":32768,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"vision":true,"fine_tuning":true},"pricing":{"input":0.26,"output":2.6},"model_type":"chat","parameters":235,"active_parameters":22,"release_date":"2025-09-23","tagline":"Qwen3-VL-235B-A22B Thinking is a multimodal model that unifies strong text generation with visual understanding across images and video.","tools":["function_calling"],"license":"apache-2.0","open_weight":true},{"id":"qwen/qwen3-vl-30b-a3b-instruct","name":"Qwen: Qwen3 VL 30B A3B Instruct","created_by":"qwen","source":"official","last_updated":"2026-05-17","family":"qwen3","description":"Qwen3-VL-30B-A3B-Instruct is a multimodal model that unifies strong text generation with visual understanding for images and videos.","context_window":262144,"max_output_tokens":32768,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"vision":true,"reasoning":true,"fine_tuning":true},"pricing":{"input":0.13,"output":0.52},"model_type":"chat","parameters":30,"active_parameters":3,"release_date":"2025-10-06","tagline":"Qwen3-VL-30B-A3B-Instruct is a multimodal model that unifies strong text generation with visual understanding for images and videos.","tools":["function_calling"],"license":"apache-2.0","open_weight":true},{"id":"qwen/qwen3-vl-30b-a3b-thinking","name":"Qwen: Qwen3 VL 30B A3B Thinking","created_by":"qwen","source":"official","last_updated":"2026-03-24","family":"qwen3","description":"Qwen3-VL-30B-A3B-Thinking is a multimodal model that unifies strong text generation with visual understanding for images and 
videos.","context_window":131072,"max_output_tokens":32768,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"vision":true,"fine_tuning":true},"pricing":{"input":0.13,"output":1.56},"model_type":"chat","parameters":30,"active_parameters":3,"release_date":"2025-10-06","tagline":"Qwen3-VL-30B-A3B-Thinking is a multimodal model that unifies strong text generation with visual understanding for images and videos.","tools":["function_calling"],"license":"apache-2.0","open_weight":true},{"id":"qwen/qwen3-vl-32b-instruct","name":"Qwen: Qwen3 VL 32B Instruct","created_by":"qwen","source":"official","last_updated":"2026-05-17","family":"qwen3","description":"Qwen3-VL-32B-Instruct is a large-scale multimodal vision-language model designed for high-precision understanding and reasoning across text, images, and video.","context_window":262144,"max_output_tokens":32768,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"vision":true,"reasoning":true,"fine_tuning":true},"pricing":{"input":0.104,"output":0.416},"model_type":"chat","parameters":32,"release_date":"2025-10-23","tagline":"Qwen3-VL-32B-Instruct is a large-scale multimodal vision-language model designed for high-precision understanding and reasoning across text, images, and video.","tools":["function_calling"],"license":"apache-2.0","open_weight":true},{"id":"qwen/qwen3-vl-8b-instruct","name":"Qwen: Qwen3 VL 8B Instruct","created_by":"qwen","source":"official","last_updated":"2026-05-17","family":"qwen3","description":"Qwen3-VL-8B-Instruct is a multimodal vision-language model from the Qwen3-VL series, built for high-fidelity understanding and reasoning across text, images, and 
video.","context_window":256000,"max_output_tokens":32768,"modalities":{"input":["image","text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"vision":true,"reasoning":true,"fine_tuning":true},"pricing":{"input":0.08,"output":0.5},"model_type":"chat","parameters":8,"release_date":"2025-10-14","tagline":"Qwen3-VL-8B-Instruct is a multimodal vision-language model from the Qwen3-VL series, built for high-fidelity understanding and reasoning across text, images, and video.","tools":["function_calling"],"license":"apache-2.0","open_weight":true},{"id":"qwen/qwen3-vl-8b-thinking","name":"Qwen: Qwen3 VL 8B Thinking","created_by":"qwen","source":"official","last_updated":"2026-05-17","family":"qwen3","description":"Qwen3-VL-8B-Thinking is the reasoning-optimized variant of the Qwen3-VL-8B multimodal model, designed for advanced visual and textual reasoning across complex scenes, documents, and temporal sequences.","context_window":256000,"max_output_tokens":32768,"modalities":{"input":["image","text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"vision":true,"fine_tuning":true},"pricing":{"input":0.117,"output":1.365},"model_type":"chat","parameters":8,"release_date":"2025-10-14","tagline":"Qwen3-VL-8B-Thinking is the reasoning-optimized variant of the Qwen3-VL-8B multimodal model, designed for advanced visual and textual reasoning across complex scenes, documents, and temporal sequences","tools":["function_calling"],"license":"apache-2.0","open_weight":true},{"id":"qwen/qwen3.5-122b-a10b","name":"Qwen: Qwen3.5-122B-A10B","created_by":"qwen","source":"official","last_updated":"2026-05-23","family":"qwen3.5","description":"The Qwen3.5 122B-A10B native vision-language model is built on a hybrid architecture that integrates a linear attention mechanism with a sparse mixture-of-experts model, achieving higher inference 
efficiency.","context_window":262144,"max_output_tokens":262144,"modalities":{"input":["text","image","video"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"fine_tuning":true,"batch":true},"pricing":{"input":0.26,"output":2.08},"model_type":"chat","parameters":122,"active_parameters":10,"release_date":"2026-02-25","tagline":"The Qwen3.5 122B-A10B native vision-language model is built on a hybrid architecture that integrates a linear attention mechanism with a sparse mixture-of-experts model, achieving higher inference eff","tools":["function_calling"],"license":"apache-2.0","open_weight":true},{"id":"qwen/qwen3.5-27b","name":"Qwen: Qwen3.5-27B","created_by":"qwen","source":"official","last_updated":"2026-03-24","family":"qwen3.5","description":"The Qwen3.5 27B native vision-language Dense model incorporates a linear attention mechanism, delivering fast response times while balancing inference speed and performance.","context_window":262144,"max_output_tokens":65536,"modalities":{"input":["text","image","video"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"fine_tuning":true,"batch":true},"pricing":{"input":0.195,"output":1.56},"model_type":"chat","parameters":27,"release_date":"2026-02-25","tagline":"The Qwen3.5 27B native vision-language Dense model incorporates a linear attention mechanism, delivering fast response times while balancing inference speed and performance.","tools":["function_calling"],"license":"apache-2.0","open_weight":true},{"id":"qwen/qwen3.5-35b-a3b","name":"Qwen: Qwen3.5-35B-A3B","created_by":"qwen","source":"official","last_updated":"2026-06-29","family":"qwen3.5","description":"The Qwen3.5 Series 35B-A3B is a native vision-language model designed with a hybrid architecture that integrates linear attention mechanisms and a sparse mixture-of-experts model, achieving higher 
inference efficiency.","context_window":262144,"max_output_tokens":81920,"modalities":{"input":["text","image","video"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"fine_tuning":true,"batch":true},"pricing":{"input":0.14,"output":1,"cached_input":0.05},"model_type":"chat","parameters":35,"active_parameters":3,"release_date":"2026-02-25","tagline":"The Qwen3.5 Series 35B-A3B is a native vision-language model designed with a hybrid architecture that integrates linear attention mechanisms and a sparse mixture-of-experts model, achieving higher inf","tools":["function_calling"],"license":"apache-2.0","open_weight":true},{"id":"qwen/qwen3.5-397b-a17b","name":"Qwen: Qwen3.5 397B A17B","created_by":"qwen","source":"official","last_updated":"2026-06-18","family":"qwen3.5","description":"The Qwen3.5 series 397B-A17B native vision-language model is built on a hybrid architecture that integrates a linear attention mechanism with a sparse mixture-of-experts model, achieving higher inference efficiency.","context_window":256000,"max_output_tokens":65536,"modalities":{"input":["text","image","video"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"fine_tuning":true,"batch":true},"pricing":{"input":0.385,"output":2.45,"cached_input":0.195},"model_type":"chat","parameters":397,"active_parameters":17,"release_date":"2026-02-16","tagline":"The Qwen3.5 series 397B-A17B native vision-language model is built on a hybrid architecture that integrates a linear attention mechanism with a sparse mixture-of-experts model, achieving higher infere","tools":["function_calling"],"license":"apache-2.0","open_weight":true},{"id":"qwen/qwen3.5-9b","name":"Qwen: Qwen3.5-9B","created_by":"qwen","source":"official","last_updated":"2026-06-10","family":"qwen3.5","description":"Qwen3.5-9B is a multimodal foundation model from the Qwen3.5 
family, designed to deliver strong reasoning, coding, and visual understanding in an efficient 9B-parameter architecture.","context_window":262144,"modalities":{"input":["text","image","video"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":0.1,"output":0.15},"model_type":"chat","parameters":9,"release_date":"2026-03-10","tagline":"Qwen3.5-9B is a multimodal foundation model from the Qwen3.5 family, designed to deliver strong reasoning, coding, and visual understanding in an efficient 9B-parameter architecture.","tools":["function_calling"],"max_output_tokens":262144},{"id":"qwen/qwen3.5-flash-02-23","name":"Qwen: Qwen3.5-Flash","created_by":"qwen","source":"official","last_updated":"2026-03-24","family":"qwen3.5","description":"The Qwen3.5 native vision-language Flash models are built on a hybrid architecture that integrates a linear attention mechanism with a sparse mixture-of-experts model, achieving higher inference efficiency.","context_window":1000000,"max_output_tokens":65536,"modalities":{"input":["text","image","video"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":0.065,"output":0.26},"model_type":"chat","release_date":"2026-02-25","tagline":"The Qwen3.5 native vision-language Flash models are built on a hybrid architecture that integrates a linear attention mechanism with a sparse mixture-of-experts model, achieving higher inference effic","tools":["function_calling"]},{"id":"qwen/qwen3.5-plus-02-15","name":"Qwen: Qwen3.5 Plus 2026-02-15","created_by":"qwen","source":"official","last_updated":"2026-03-24","family":"qwen3.5","description":"The Qwen3.5 native vision-language series Plus models are built on a hybrid architecture that integrates linear attention mechanisms with sparse mixture-of-experts models, achieving higher inference 
efficiency.","context_window":1000000,"max_output_tokens":65536,"modalities":{"input":["text","image","video"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":0.26,"output":1.56},"model_type":"chat","release_date":"2026-02-16","tagline":"The Qwen3.5 native vision-language series Plus models are built on a hybrid architecture that integrates linear attention mechanisms with sparse mixture-of-experts models, achieving higher inference e","tools":["function_calling"]},{"id":"qwen/qwen3.5-plus-20260420","name":"Qwen: Qwen3.5 Plus 2026-04-20","created_by":"qwen","source":"official","family":"qwen3.5","description":"Qwen3.5 Plus (April 2026) is a large-scale multimodal language model from Alibaba.","release_date":"2026-04-27","context_window":1000000,"max_output_tokens":65536,"model_type":"chat","alias":"qwen/qwen3.5-plus","tagline":"Qwen3.5 Plus (April 2026) is a large-scale multimodal language model from Alibaba.","capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"modalities":{"input":["text","image","video"],"output":["text"]},"pricing":{"input":0.3,"output":1.8},"tools":["function_calling"],"last_updated":"2026-05-17"},{"id":"qwen/qwen3.5-plus","name":"Qwen: Qwen3.5 Plus 2026-04-20","created_by":"qwen","source":"official","family":"qwen3.5","description":"Qwen3.5 Plus (April 2026) is a large-scale multimodal language model from Alibaba.","release_date":"2026-04-27","context_window":1000000,"max_output_tokens":65536,"model_type":"chat","tagline":"Qwen3.5 Plus (April 2026) is a large-scale multimodal language model from 
Alibaba.","capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"batch":true},"modalities":{"input":["text","image","video"],"output":["text"]},"pricing":{"input":0.3,"output":1.8},"tools":["function_calling"],"snapshots":["qwen/qwen3.5-plus-20260420"],"last_updated":"2026-05-17","license":"proprietary","open_weight":false},{"id":"qwen/qwen3.6-27b","name":"Qwen: Qwen3.6 27B","created_by":"qwen","source":"official","family":"qwen3.6","description":"Qwen3.6 27B is a dense 27-billion-parameter language model from the Qwen Team at Alibaba, released in April 2026.","release_date":"2026-04-27","context_window":262144,"max_output_tokens":262140,"parameters":27,"model_type":"chat","tagline":"Qwen3.6 27B is a dense 27-billion-parameter language model from the Qwen Team at Alibaba, released in April 2026.","capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text","image","video"],"output":["text"]},"pricing":{"input":0.26,"output":2.385},"tools":["function_calling"],"last_updated":"2026-06-29","license":"apache-2.0","open_weight":true},{"id":"qwen/qwen3.6-35b-a3b","name":"Qwen: Qwen3.6 35B A3B","created_by":"qwen","source":"official","family":"qwen3.6","description":"Qwen3.6-35B-A3B is an open-weight multimodal model from Alibaba Cloud with 35 billion total parameters and 3 billion active parameters per token.","release_date":"2026-04-27","context_window":262144,"max_output_tokens":262144,"parameters":35,"active_parameters":3,"model_type":"chat","tagline":"Qwen3.6-35B-A3B is an open-weight multimodal model from Alibaba Cloud with 35 billion total parameters and 3 billion active parameters per 
token.","capabilities":{"structured_output":true,"reasoning":true,"json_mode":true,"tool_call":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text","image","video"],"output":["text"]},"pricing":{"input":0.14,"output":1,"cached_input":0.05},"last_updated":"2026-06-20","tools":["function_calling"],"license":"apache-2.0","open_weight":true},{"id":"qwen/qwen3.6-flash","name":"Qwen: Qwen3.6 Flash","created_by":"qwen","source":"official","family":"qwen3.6","description":"Qwen3.6 Flash is a fast, efficient language model from Alibaba's Qwen 3.6 series.","release_date":"2026-04-27","context_window":1000000,"max_output_tokens":65536,"model_type":"chat","tagline":"Qwen3.6 Flash is a fast, efficient language model from Alibaba's Qwen 3.6 series.","capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"fine_tuning":true,"batch":true},"modalities":{"input":["text","image","video"],"output":["text"]},"pricing":{"input":0.188,"output":1.125},"tools":["function_calling"],"last_updated":"2026-05-17","license":"apache-2.0","open_weight":true},{"id":"qwen/qwen3.6-max-preview","name":"Qwen: Qwen3.6 Max Preview","created_by":"qwen","source":"official","family":"qwen3.6","description":"Qwen3.6-Max-Preview is a proprietary frontier model from Alibaba Cloud built on a sparse mixture-of-experts architecture with approximately 1 trillion total parameters.","release_date":"2026-04-27","context_window":262144,"max_output_tokens":65536,"model_type":"chat","tagline":"Qwen3.6-Max-Preview is a proprietary frontier model from Alibaba Cloud built on a sparse mixture-of-experts architecture with approximately 1 trillion total 
parameters.","capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"fine_tuning":true,"batch":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":1.04,"output":6.24},"tools":["function_calling"],"last_updated":"2026-05-01","license":"apache-2.0","open_weight":true},{"id":"qwen/qwen3.6-plus:free","name":"Qwen: Qwen3.6 Plus (free)","created_by":"qwen","source":"official","family":"qwen3.6","description":"Qwen 3.6 Plus builds on a hybrid architecture that combines efficient linear attention with sparse mixture-of-experts routing, enabling strong scalability and high-performance inference.","release_date":"2026-04-02","context_window":1000000,"max_output_tokens":65536,"model_type":"chat","tagline":"Qwen 3.6 Plus builds on a hybrid architecture that combines efficient linear attention with sparse mixture-of-experts routing, enabling strong scalability and high-performance inference.","capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"modalities":{"input":["text","image","video"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-04-03"},{"id":"qwen/qwen3.6-plus-preview:free","name":"Qwen: Qwen3.6 Plus Preview (free)","created_by":"qwen","source":"official","family":"qwen3.6","description":"Qwen 3.6 Plus Preview is the next-generation evolution of the Qwen Plus series, featuring an advanced hybrid architecture that improves efficiency and scalability.","release_date":"2026-03-30","context_window":1000000,"max_output_tokens":32000,"model_type":"chat","tagline":"Qwen 3.6 Plus Preview is the next-generation evolution of the Qwen Plus series, featuring an advanced hybrid architecture that improves efficiency and 
scalability.","capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-04-01"},{"id":"qwen/qwen3.6-plus","name":"Qwen: Qwen3.6 Plus","created_by":"qwen","source":"official","family":"qwen3.6","description":"Qwen 3.6 Plus builds on a hybrid architecture that combines efficient linear attention with sparse mixture-of-experts routing, enabling strong scalability and high-performance inference.","release_date":"2026-04-02","context_window":1000000,"max_output_tokens":65536,"model_type":"chat","tagline":"Qwen 3.6 Plus builds on a hybrid architecture that combines efficient linear attention with sparse mixture-of-experts routing, enabling strong scalability and high-performance inference.","capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"fine_tuning":true,"batch":true},"modalities":{"input":["text","image","video"],"output":["text"]},"pricing":{"input":0.325,"output":1.95},"tools":["function_calling"],"last_updated":"2026-04-08","license":"apache-2.0","open_weight":true},{"id":"qwen/qwen3.7-max","name":"Qwen: Qwen3.7 Max","created_by":"qwen","source":"official","family":"qwen3.7","description":"Qwen3.7-Max is the flagship model in Alibaba's Qwen3.7 series.","release_date":"2026-05-21","context_window":1000000,"max_output_tokens":65536,"model_type":"chat","tagline":"Qwen3.7-Max is the flagship model in Alibaba's Qwen3.7 series.","capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"batch":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":1.25,"output":3.75,"cached_input":0.25},"tools":["function_calling"],"last_updated":"2026-05-29","license":"apache-2.0","open_weight":true},{"id":"qwen/qwen3.7-plus","name":"Qwen: Qwen3.7 
Plus","created_by":"qwen","source":"official","family":"qwen3.7","description":"Qwen3.7-Plus is a cost-effective model in Alibaba's Qwen3.7 series.","release_date":"2026-06-03","context_window":1000000,"max_output_tokens":65536,"model_type":"chat","tagline":"Qwen3.7-Plus is a cost-effective model in Alibaba's Qwen3.7 series.","capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"batch":true,"fine_tuning":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":0.32,"output":1.28,"cached_input":0.064},"tools":["function_calling"],"last_updated":"2026-06-18","license":"apache-2.0","open_weight":true},{"id":"qwen/qwq-32b","name":"Qwen: QwQ 32B","created_by":"qwen","source":"official","last_updated":"2026-04-22","family":"qwq","description":"QwQ is the reasoning model of the Qwen series.","context_window":131072,"max_output_tokens":131072,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"reasoning":true,"streaming":true,"fine_tuning":true},"pricing":{"input":0.15,"output":0.58},"model_type":"chat","parameters":32,"release_date":"2025-03-05","tagline":"QwQ is the reasoning model of the Qwen series.","tools":["function_calling"],"status":"deprecated","deprecation_date":"2026-04-29","license":"apache-2.0","open_weight":true},{"id":"reka/reka-edge","name":"Reka Edge","created_by":"reka","source":"official","description":"Reka Edge is an extremely efficient 7B multimodal vision-language model that accepts image/video+text inputs and generates text outputs.","release_date":"2026-03-20","context_window":16384,"max_output_tokens":16384,"tagline":"Reka Edge is an extremely efficient 7B multimodal vision-language model that accepts image/video+text inputs and generates text 
outputs.","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"vision":true,"streaming":true},"modalities":{"input":["image","text","video"],"output":["text"]},"pricing":{"input":0.1,"output":0.1},"tools":["function_calling"],"last_updated":"2026-03-27","license":"proprietary","open_weight":false},{"id":"rekaai/reka-edge","name":"Reka Edge","created_by":"rekaai","source":"official","description":"Reka Edge is an extremely efficient 7B multimodal vision-language model that accepts image/video+text inputs and generates text outputs.","release_date":"2026-03-20","context_window":16384,"max_output_tokens":16384,"tagline":"Reka Edge is an extremely efficient 7B multimodal vision-language model that accepts image/video+text inputs and generates text outputs.","capabilities":{"tool_call":true,"structured_output":true,"json_mode":true},"modalities":{"input":["image","text","video"],"output":["text"]},"pricing":{"input":0.1,"output":0.1},"tools":["function_calling"],"last_updated":"2026-04-03"},{"id":"rekaai/reka-flash-3","name":"Reka Flash 3","created_by":"rekaai","source":"official","description":"Reka Flash 3 is a general-purpose, instruction-tuned large language model with 21 billion parameters, developed by Reka.","release_date":"2025-03-12","context_window":65536,"max_output_tokens":65536,"tagline":"Reka Flash 3 is a general-purpose, instruction-tuned large language model with 21 billion parameters, developed by Reka.","capabilities":{"reasoning":true,"structured_output":true,"json_mode":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.1,"output":0.2},"last_updated":"2026-06-20"},{"id":"relace/relace-apply-3","name":"Relace: Relace Apply 3","created_by":"relace","source":"official","last_updated":"2026-03-23","description":"Relace Apply 3 is a specialized code-patching LLM that merges AI-suggested edits straight into your source 
files.","context_window":256000,"max_output_tokens":128000,"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.85,"output":1.25},"release_date":"2025-09-26","tagline":"Relace Apply 3 is a specialized code-patching LLM that merges AI-suggested edits straight into your source files."},{"id":"relace/relace-search","name":"Relace: Relace Search","created_by":"relace","source":"official","last_updated":"2026-06-20","description":"The relace-search model uses 4-12 `view_file` and `grep` tools in parallel to explore a codebase and return relevant files to the user request.","context_window":256000,"max_output_tokens":128000,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true},"pricing":{"input":1,"output":3},"model_type":"chat","release_date":"2025-12-08","tagline":"The relace-search model uses 4-12 `view_file` and `grep` tools in parallel to explore a codebase and return relevant files to the user request.","tools":["function_calling"]},{"id":"sakana/fugu-ultra","name":"Sakana: Fugu Ultra","created_by":"sakana","source":"official","description":"Fugu Ultra is the higher-performance model in Sakana AI's Fugu family.","release_date":"2026-06-24","context_window":1000000,"max_output_tokens":128000,"tagline":"Fugu Ultra is the higher-performance model in Sakana AI's Fugu family.","capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":5,"output":30,"cached_input":0.5},"tools":["function_calling"],"last_updated":"2026-06-29"},{"id":"sao10k/l3-euryale-70b","name":"Sao10k: Llama 3 Euryale 70B v2.1","created_by":"sao10k","source":"official","last_updated":"2026-05-29","description":"Euryale 70B v2.1 is a model focused on creative roleplay from 
[Sao10k](https://ko-fi.com/sao10k).","context_window":8192,"max_output_tokens":8192,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true},"pricing":{"input":1.48,"output":1.48},"parameters":70,"release_date":"2024-06-18","tagline":"Euryale 70B v2.1 is a model focused on creative roleplay from [Sao10k](https://ko-fi.com/sao10k).","tools":["function_calling"],"status":"deprecated","deprecation_date":"2026-06-05"},{"id":"sao10k/l3-lunaris-8b","name":"Sao10K: Llama 3 8B Lunaris","created_by":"sao10k","source":"official","last_updated":"2026-04-25","description":"Lunaris 8B is a versatile generalist and roleplaying model based on Llama 3.","context_window":8192,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"structured_output":true,"json_mode":true},"pricing":{"input":0.04,"output":0.05},"parameters":8,"release_date":"2024-08-13","tagline":"Lunaris 8B is a versatile generalist and roleplaying model based on Llama 3.","max_output_tokens":16384},{"id":"sao10k/l3.1-70b-hanami-x1","name":"Sao10K: Llama 3.1 70B Hanami x1","created_by":"sao10k","source":"official","last_updated":"2026-06-20","description":"This is [Sao10K](/sao10k)'s experiment over [Euryale v2.2](/sao10k/l3.1-euryale-70b).","context_window":16000,"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":3,"output":3},"parameters":70,"release_date":"2025-01-08","tagline":"This is [Sao10K](/sao10k)'s experiment over [Euryale v2.2](/sao10k/l3.1-euryale-70b).","capabilities":{"structured_output":true,"json_mode":true}},{"id":"sao10k/l3.1-euryale-70b","name":"Sao10K: Llama 3.1 Euryale 70B v2.2","created_by":"sao10k","source":"official","last_updated":"2026-03-24","description":"Euryale L3.1 70B v2.2 is a model focused on creative roleplay from 
[Sao10k](https://ko-fi.com/sao10k).","context_window":131072,"max_output_tokens":16384,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true},"pricing":{"input":0.85,"output":0.85},"parameters":70,"release_date":"2024-08-28","tagline":"Euryale L3.1 70B v2.2 is a model focused on creative roleplay from [Sao10k](https://ko-fi.com/sao10k).","tools":["function_calling"]},{"id":"sao10k/l3.3-euryale-70b","name":"Sao10K: Llama 3.3 Euryale 70B","created_by":"sao10k","source":"official","last_updated":"2026-03-24","description":"Euryale L3.3 70B is a model focused on creative roleplay from [Sao10k](https://ko-fi.com/sao10k).","context_window":131072,"max_output_tokens":16384,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"structured_output":true,"json_mode":true},"pricing":{"input":0.65,"output":0.75},"parameters":70,"release_date":"2024-12-18","tagline":"Euryale L3.3 70B is a model focused on creative roleplay from [Sao10k](https://ko-fi.com/sao10k)."},{"id":"stepfun/step-3.5-flash:free","name":"StepFun: Step 3.5 Flash (free)","created_by":"stepfun","source":"official","last_updated":"2026-03-23","description":"Step 3.5 Flash is StepFun's most capable open-source foundation model.","context_window":256000,"max_output_tokens":256000,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"reasoning":true},"release_date":"2026-01-29","tagline":"Step 3.5 Flash is StepFun's most capable open-source foundation model.","tools":["function_calling"]},{"id":"stepfun/step-3.5-flash","name":"StepFun: Step 3.5 Flash","created_by":"stepfun","source":"official","last_updated":"2026-06-30","description":"Step 3.5 Flash is StepFun's most capable open-source foundation 
model.","context_window":262144,"max_output_tokens":65536,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"reasoning":true,"structured_output":true,"json_mode":true,"streaming":true,"fine_tuning":true},"pricing":{"input":0.1,"output":0.3,"cached_input":0.02},"release_date":"2026-01-29","tagline":"Step 3.5 Flash is StepFun's most capable open-source foundation model.","tools":["function_calling"],"status":"deprecated","deprecation_date":"2026-06-29","license":"apache-2.0","open_weight":true},{"id":"stepfun/step-3.7-flash","name":"StepFun: Step 3.7 Flash","created_by":"stepfun","source":"official","description":"Step 3.7 Flash is StepFun's latest high-efficiency multimodal Mixture-of-Experts model.","release_date":"2026-05-28","context_window":256000,"max_output_tokens":256000,"tagline":"Step 3.7 Flash is StepFun's latest high-efficiency multimodal Mixture-of-Experts model.","capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"modalities":{"input":["text","image","video"],"output":["text"]},"pricing":{"input":0.2,"output":1.15,"cached_input":0.04},"tools":["function_calling"],"last_updated":"2026-06-02"},{"id":"switchpoint/router","name":"Switchpoint Router","created_by":"switchpoint","source":"official","last_updated":"2026-06-20","description":"Switchpoint AI's router instantly analyzes your request and directs it to the optimal AI from an ever-evolving library.","context_window":131072,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"reasoning":true,"structured_output":true,"json_mode":true},"pricing":{"input":0.85,"output":3.4},"release_date":"2025-07-11","tagline":"Switchpoint AI's router instantly analyzes your request and directs it to the optimal AI from an ever-evolving library."},{"id":"tencent/hunyuan-a13b-instruct","name":"Tencent: Hunyuan A13B Instruct","created_by":"tencent","source":"official","last_updated":"2026-03-24","description":"Hunyuan-A13B is a 13B 
active parameter Mixture-of-Experts (MoE) language model developed by Tencent, with a total parameter count of 80B and support for reasoning via Chain-of-Thought.","context_window":131072,"max_output_tokens":131072,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":0.14,"output":0.57},"release_date":"2025-07-08","tagline":"Hunyuan-A13B is a 13B active parameter Mixture-of-Experts (MoE) language model developed by Tencent, with a total parameter count of 80B and support for reasoning via Chain-of-Thought."},{"id":"tencent/hy3-preview:free","name":"Tencent: Hy3 preview (free)","created_by":"tencent","source":"official","description":"Hy3 preview is a high-efficiency Mixture-of-Experts model from Tencent designed for agentic workflows and production use.","release_date":"2026-04-22","context_window":262144,"max_output_tokens":262144,"tagline":"Hy3 preview is a high-efficiency Mixture-of-Experts model from Tencent designed for agentic workflows and production use.","capabilities":{"tool_call":true,"reasoning":true},"modalities":{"input":["text"],"output":["text"]},"tools":["function_calling"],"last_updated":"2026-04-25","status":"deprecated","deprecation_date":"2026-05-08"},{"id":"tencent/hy3-preview","name":"Tencent: Hy3 preview","created_by":"tencent","source":"official","description":"Hy3 preview is a high-efficiency Mixture-of-Experts model from Tencent designed for agentic workflows and production use.","release_date":"2026-04-22","context_window":262144,"max_output_tokens":262144,"tagline":"Hy3 preview is a high-efficiency Mixture-of-Experts model from Tencent designed for agentic workflows and production 
use.","capabilities":{"tool_call":true,"reasoning":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.063,"output":0.21,"cached_input":0.021},"tools":["function_calling"],"last_updated":"2026-06-20"},{"id":"thedrummer/cydonia-24b-v4.1","name":"TheDrummer: Cydonia 24B V4.1","created_by":"thedrummer","source":"official","last_updated":"2026-06-18","description":"Uncensored and creative writing model based on Mistral Small 3.2 24B with good recall, prompt adherence, and intelligence.","context_window":131072,"max_output_tokens":131072,"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.3,"output":0.5,"cached_input":0.15},"parameters":24,"release_date":"2025-09-27","tagline":"Uncensored and creative writing model based on Mistral Small 3.2 24B with good recall, prompt adherence, and intelligence.","capabilities":{"structured_output":true,"json_mode":true}},{"id":"thedrummer/rocinante-12b","name":"TheDrummer: Rocinante 12B","created_by":"thedrummer","source":"official","last_updated":"2026-06-29","description":"Rocinante 12B is designed for engaging storytelling and rich prose.","context_window":32768,"max_output_tokens":32768,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true},"pricing":{"input":0.25,"output":0.5},"parameters":12,"release_date":"2024-09-30","tagline":"Rocinante 12B is designed for engaging storytelling and rich prose.","tools":["function_calling"]},{"id":"thedrummer/skyfall-36b-v2","name":"TheDrummer: Skyfall 36B V2","created_by":"thedrummer","source":"official","last_updated":"2026-06-20","description":"Skyfall 36B v2 is an enhanced iteration of Mistral Small 2501, specifically fine-tuned for improved creativity, nuanced writing, role-playing, and coherent 
storytelling.","context_window":32768,"max_output_tokens":32768,"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.55,"output":0.8,"cached_input":0.25},"parameters":36,"release_date":"2025-03-10","tagline":"Skyfall 36B v2 is an enhanced iteration of Mistral Small 2501, specifically fine-tuned for improved creativity, nuanced writing, role-playing, and coherent storytelling.","capabilities":{"structured_output":true,"json_mode":true}},{"id":"thedrummer/unslopnemo-12b","name":"TheDrummer: UnslopNemo 12B","created_by":"thedrummer","source":"official","last_updated":"2026-03-24","description":"UnslopNemo v4.1 is the latest addition from the creator of Rocinante, designed for adventure writing and role-play scenarios.","context_window":32768,"max_output_tokens":32768,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true},"pricing":{"input":0.4,"output":0.4},"parameters":12,"release_date":"2024-11-08","tagline":"UnslopNemo v4.1 is the latest addition from the creator of Rocinante, designed for adventure writing and role-play scenarios.","tools":["function_calling"]},{"id":"tngtech/deepseek-r1t2-chimera","name":"TNG: DeepSeek R1T2 Chimera","created_by":"tngtech","source":"official","last_updated":"2026-03-24","family":"deepseek-r1","description":"DeepSeek-TNG-R1T2-Chimera is the second-generation Chimera model from TNG Tech.","context_window":163840,"max_output_tokens":163840,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":0.3,"output":1.1,"cached_input":0.15},"model_type":"reasoning","release_date":"2025-07-08","tagline":"DeepSeek-TNG-R1T2-Chimera is the second-generation Chimera model from TNG Tech.","tools":["function_calling"]},{"id":"undi95/remm-slerp-l2-13b","name":"ReMM SLERP 
13B","created_by":"undi95","source":"official","last_updated":"2026-03-24","description":"A recreation trial of the original MythoMax-L2-B13 but with updated models.","context_window":6144,"max_output_tokens":4096,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"structured_output":true,"json_mode":true},"pricing":{"input":0.45,"output":0.65},"parameters":13,"release_date":"2023-07-22","tagline":"A recreation trial of the original MythoMax-L2-B13 but with updated models."},{"id":"upstage/solar-pro-3","name":"Upstage: Solar Pro 3","created_by":"upstage","source":"official","last_updated":"2026-03-24","description":"Solar Pro 3 is Upstage's powerful Mixture-of-Experts (MoE) language model.","context_window":128000,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":0.15,"output":0.6,"cached_input":0.015},"release_date":"2026-01-27","tagline":"Solar Pro 3 is Upstage's powerful Mixture-of-Experts (MoE) language model.","tools":["function_calling"]},{"id":"writer/palmyra-x5","name":"Writer: Palmyra X5","created_by":"writer","source":"official","last_updated":"2026-03-23","description":"Palmyra X5 is Writer's most advanced model, purpose-built for building and scaling AI agents across the enterprise.","context_window":1040000,"max_output_tokens":8192,"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.6,"output":6},"model_type":"chat","release_date":"2026-01-21","tagline":"Palmyra X5 is Writer's most advanced model, purpose-built for building and scaling AI agents across the enterprise.","license":"proprietary","open_weight":false,"capabilities":{"vision":true,"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true}},{"id":"x-ai/grok-3-beta","name":"xAI: Grok 3 Beta","created_by":"xai","source":"official","last_updated":"2026-05-07","family":"grok-3","description":"Grok 3 is the latest model from 
xAI.","context_window":131072,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true},"pricing":{"input":3,"output":15,"cached_input":0.75},"model_type":"chat","release_date":"2025-04-09","tagline":"Grok 3 is the latest model from xAI.","tools":["function_calling"],"status":"deprecated","deprecation_date":"2026-05-15"},{"id":"x-ai/grok-3-mini-beta","name":"xAI: Grok 3 Mini Beta","created_by":"xai","source":"official","last_updated":"2026-05-07","family":"grok-3","description":"Grok 3 Mini is a lightweight, smaller thinking model.","context_window":131072,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":0.3,"output":0.5,"cached_input":0.075},"model_type":"chat","release_date":"2025-04-09","tagline":"Grok 3 Mini is a lightweight, smaller thinking model.","tools":["function_calling"],"status":"deprecated","deprecation_date":"2026-05-15"},{"id":"x-ai/grok-3-mini","name":"xAI: Grok 3 Mini","created_by":"xai","source":"official","last_updated":"2026-05-07","family":"grok-3","description":"A lightweight model that thinks before responding.","context_window":131072,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"batch":true},"pricing":{"input":0.3,"output":0.5,"cached_input":0.075},"model_type":"chat","release_date":"2025-06-10","tagline":"A lightweight model that thinks before responding.","tools":["function_calling"],"status":"deprecated","deprecation_date":"2026-05-15","knowledge_cutoff":"2024-11","license":"proprietary","open_weight":false},{"id":"x-ai/grok-3","name":"xAI: Grok 3","created_by":"xai","source":"official","last_updated":"2026-05-07","family":"grok-3","description":"Grok 3 is the latest model from 
xAI.","context_window":131072,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"json_mode":true,"streaming":true,"batch":true},"pricing":{"input":3,"output":15,"cached_input":0.75},"model_type":"chat","release_date":"2025-06-10","tagline":"Grok 3 is the latest model from xAI.","tools":["function_calling"],"status":"deprecated","deprecation_date":"2026-05-15","knowledge_cutoff":"2024-11","license":"proprietary","open_weight":false},{"id":"x-ai/grok-4-fast","name":"xAI: Grok 4 Fast","created_by":"xai","source":"official","last_updated":"2026-05-07","family":"grok-4","description":"Grok 4 Fast is xAI's latest multimodal model with SOTA cost-efficiency and a 2M token context window.","context_window":2000000,"max_output_tokens":30000,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":0.2,"output":0.5,"cached_input":0.05},"model_type":"chat","release_date":"2025-09-19","tagline":"Grok 4 Fast is xAI's latest multimodal model with SOTA cost-efficiency and a 2M token context window.","tools":["function_calling"],"status":"deprecated","deprecation_date":"2026-05-15"},{"id":"x-ai/grok-4.1-fast","name":"xAI: Grok 4.1 Fast","created_by":"xai","source":"official","last_updated":"2026-05-07","family":"grok-4.1","description":"Grok 4.1 Fast is xAI's best agentic tool calling model that shines in real-world use cases like customer support and deep research.","context_window":2000000,"max_output_tokens":30000,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":0.2,"output":0.5,"cached_input":0.05},"model_type":"chat","release_date":"2025-11-19","tagline":"Grok 4.1 Fast is xAI's best agentic tool calling model that shines in real-world use cases like customer support and deep 
research.","tools":["function_calling"],"status":"deprecated","deprecation_date":"2026-05-15"},{"id":"x-ai/grok-4.20-beta","name":"xAI: Grok 4.20 Beta","created_by":"xai","source":"official","last_updated":"2026-03-24","family":"grok-4.20","description":"Grok 4.20 Beta is xAI's newest flagship model with industry-leading speed and agentic tool calling capabilities.","context_window":2000000,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":2,"output":6,"cached_input":0.2},"model_type":"chat","release_date":"2026-03-12","tagline":"Grok 4.20 Beta is xAI's newest flagship model with industry-leading speed and agentic tool calling capabilities.","tools":["function_calling"]},{"id":"x-ai/grok-4.20-multi-agent-beta","name":"xAI: Grok 4.20 Multi-Agent Beta","created_by":"xai","source":"official","last_updated":"2026-03-24","family":"grok-4.20","description":"Grok 4.20 Multi-Agent Beta is a variant of xAI’s Grok 4.20 designed for collaborative, agent-based workflows.","context_window":2000000,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":2,"output":6,"cached_input":0.2},"model_type":"chat","release_date":"2026-03-12","tagline":"Grok 4.20 Multi-Agent Beta is a variant of xAI’s Grok 4.20 designed for collaborative, agent-based workflows."},{"id":"x-ai/grok-4.20-multi-agent","name":"xAI: Grok 4.20 Multi-Agent","created_by":"xai","source":"official","family":"grok-4.20","description":"Grok 4.20 Multi-Agent is a variant of xAI’s Grok 4.20 designed for collaborative, agent-based workflows.","release_date":"2026-03-31","context_window":2000000,"model_type":"chat","tagline":"Grok 4.20 Multi-Agent is a variant of xAI’s Grok 4.20 designed for collaborative, agent-based 
workflows.","capabilities":{"structured_output":true,"reasoning":true,"json_mode":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":1.25,"output":2.5,"cached_input":0.2},"last_updated":"2026-06-18"},{"id":"x-ai/grok-4.20","name":"xAI: Grok 4.20","created_by":"xai","source":"official","family":"grok-4.20","description":"Grok 4.20 is a reasoning model from xAI with industry-leading speed and agentic tool calling capabilities.","release_date":"2026-03-31","context_window":2000000,"model_type":"chat","tagline":"Grok 4.20 is xAI's newest flagship model with industry-leading speed and agentic tool calling capabilities.","capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":1.25,"output":2.5,"cached_input":0.2},"tools":["function_calling"],"last_updated":"2026-05-10"},{"id":"x-ai/grok-4.3","name":"xAI: Grok 4.3","created_by":"xai","source":"official","family":"grok-4.3","description":"Grok 4.3 is a reasoning model from xAI.","release_date":"2026-04-30","context_window":1000000,"model_type":"chat","tagline":"Grok 4.3 is a reasoning model from xAI.","capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"batch":true,"vision":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":1.25,"output":2.5,"cached_input":0.2},"tools":["function_calling"],"last_updated":"2026-05-01","knowledge_cutoff":"2024-11","license":"proprietary","open_weight":false},{"id":"x-ai/grok-4","name":"xAI: Grok 4","created_by":"xai","source":"official","last_updated":"2026-05-07","family":"grok-4","description":"Grok 4 is xAI's latest reasoning model with a 256k context 
window.","context_window":256000,"modalities":{"input":["image","text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":3,"output":15,"cached_input":0.75},"model_type":"chat","release_date":"2025-07-09","tagline":"Grok 4 is xAI's latest reasoning model with a 256k context window.","tools":["function_calling"],"status":"deprecated","deprecation_date":"2026-05-15"},{"id":"x-ai/grok-build-0.1","name":"xAI: Grok Build 0.1","created_by":"xai","source":"official","description":"Grok Build 0.1 is xAI’s fast coding model trained specifically for agentic software engineering workflows.","release_date":"2026-05-20","context_window":256000,"model_type":"chat","tagline":"Grok Build 0.1 is xAI’s fast coding model trained specifically for agentic software engineering workflows.","capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"batch":true,"vision":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":1,"output":2,"cached_input":0.2},"tools":["function_calling"],"last_updated":"2026-05-23","license":"proprietary","open_weight":false},{"id":"x-ai/grok-code-fast-1","name":"xAI: Grok Code Fast 1","created_by":"xai","source":"official","last_updated":"2026-05-07","family":"grok-code","description":"Grok Code Fast 1 is a speedy and economical reasoning model that excels at agentic coding.","context_window":256000,"max_output_tokens":10000,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"batch":true},"pricing":{"input":0.2,"output":1.5,"cached_input":0.02},"model_type":"code","release_date":"2025-08-26","tagline":"Grok Code Fast 1 is a speedy and economical reasoning model that excels at agentic 
coding.","tools":["function_calling"],"status":"deprecated","deprecation_date":"2026-05-15","license":"proprietary","open_weight":false},{"id":"xiaomi/mimo-v2-flash","name":"Xiaomi: MiMo-V2-Flash","created_by":"xiaomi","source":"official","last_updated":"2026-05-10","description":"MiMo-V2-Flash is an open-source foundation language model developed by Xiaomi.","context_window":262144,"max_output_tokens":65536,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"fine_tuning":true},"pricing":{"input":0.1,"output":0.3,"cached_input":0.01},"release_date":"2025-12-14","tagline":"MiMo-V2-Flash is an open-source foundation language model developed by Xiaomi.","tools":["function_calling"],"family":"mimo","model_type":"chat","knowledge_cutoff":"2024-12","license":"mit","parameters":309,"active_parameters":15,"architecture":"moe","open_weight":true},{"id":"xiaomi/mimo-v2-omni","name":"Xiaomi: MiMo-V2-Omni","created_by":"xiaomi","source":"official","last_updated":"2026-05-29","description":"MiMo-V2-Omni is a frontier omni-modal model that natively processes image, video, and audio inputs within a unified architecture.","context_window":262144,"max_output_tokens":65536,"modalities":{"input":["text","audio","image","video"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"vision":true},"pricing":{"input":0.4,"output":2,"cached_input":0.08},"release_date":"2026-03-18","tagline":"MiMo-V2-Omni is a frontier omni-modal model that natively processes image, video, and audio inputs within a unified architecture.","tools":["function_calling"],"family":"mimo","model_type":"chat","status":"deprecated","deprecation_date":"2026-05-31","license":"proprietary","open_weight":false},{"id":"xiaomi/mimo-v2-pro","name":"Xiaomi: 
MiMo-V2-Pro","created_by":"xiaomi","source":"official","last_updated":"2026-05-29","description":"MiMo-V2-Pro is Xiaomi's flagship foundation model, featuring over 1T total parameters and a 1M context length, deeply optimized for agentic scenarios.","context_window":1048576,"max_output_tokens":131072,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true},"pricing":{"input":1,"output":3,"cached_input":0.2},"release_date":"2026-03-18","tagline":"MiMo-V2-Pro is Xiaomi's flagship foundation model, featuring over 1T total parameters and a 1M context length, deeply optimized for agentic scenarios.","tools":["function_calling"],"family":"mimo","model_type":"chat","status":"deprecated","deprecation_date":"2026-05-31","license":"proprietary","parameters":1000,"active_parameters":42,"architecture":"moe","open_weight":false},{"id":"xiaomi/mimo-v2.5-pro","name":"Xiaomi: MiMo-V2.5-Pro","created_by":"xiaomi","source":"official","family":"mimo","description":"MiMo-V2.5-Pro is Xiaomi’s flagship model, delivering strong performance in general agentic capabilities, complex software engineering, and long-horizon tasks, with top rankings on benchmarks such as C","release_date":"2026-04-22","context_window":1048576,"max_output_tokens":131072,"model_type":"chat","tagline":"MiMo-V2.5-Pro is Xiaomi’s flagship model, delivering strong performance in general agentic capabilities, complex software engineering, and long-horizon tasks, with top rankings on benchmarks such as C","capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.435,"output":0.87,"cached_input":0.004},"tools":["function_calling"],"last_updated":"2026-05-29"},{"id":"xiaomi/mimo-v2.5","name":"Xiaomi: MiMo-V2.5","created_by":"xiaomi","source":"official","family":"mimo","description":"MiMo-V2.5 is a 
native omnimodal model by Xiaomi.","release_date":"2026-04-22","context_window":1048576,"max_output_tokens":131072,"model_type":"chat","tagline":"MiMo-V2.5 is a native omnimodal model by Xiaomi.","capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true,"streaming":true,"vision":true},"modalities":{"input":["text","audio","image","video"],"output":["text"]},"pricing":{"input":0.105,"output":0.28,"cached_input":0.003},"tools":["function_calling"],"last_updated":"2026-06-29"},{"id":"z-ai/glm-4-32b","name":"Z.ai: GLM 4 32B ","created_by":"z-ai","source":"official","last_updated":"2026-03-23","description":"GLM 4 32B is a cost-effective foundation language model.","context_window":128000,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true},"pricing":{"input":0.1,"output":0.1},"family":"glm-4","model_type":"chat","parameters":32,"release_date":"2025-07-24","tagline":"GLM 4 32B is a cost-effective foundation language model.","tools":["function_calling"]},{"id":"z-ai/glm-4.5-air:free","name":"Z.ai: GLM 4.5 Air (free)","created_by":"z-ai","source":"official","last_updated":"2026-03-23","description":"GLM-4.5-Air is the lightweight variant of our latest flagship model family, also purpose-built for agent-centric applications.","context_window":131072,"max_output_tokens":96000,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"reasoning":true},"family":"glm-4.5","model_type":"chat","release_date":"2025-07-25","tagline":"GLM-4.5-Air is the lightweight variant of our latest flagship model family, also purpose-built for agent-centric applications.","tools":["function_calling"]},{"id":"z-ai/glm-4.5-air","name":"Z.ai: GLM 4.5 Air","created_by":"z-ai","source":"official","last_updated":"2026-06-18","description":"GLM-4.5-Air is the lightweight variant of our latest flagship model family, also purpose-built for agent-centric 
applications.","context_window":131072,"max_output_tokens":98304,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":0.13,"output":0.85,"cached_input":0.025},"family":"glm-4.5","model_type":"chat","release_date":"2025-07-25","tagline":"GLM-4.5-Air is the lightweight variant of our latest flagship model family, also purpose-built for agent-centric applications.","tools":["function_calling"]},{"id":"z-ai/glm-4.5","name":"Z.ai: GLM 4.5","created_by":"z-ai","source":"official","last_updated":"2026-06-20","description":"GLM-4.5 is our latest flagship foundation model, purpose-built for agent-based applications.","context_window":131072,"max_output_tokens":98304,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":0.6,"output":2.2,"cached_input":0.11},"family":"glm-4.5","model_type":"chat","release_date":"2025-07-25","tagline":"GLM-4.5 is our latest flagship foundation model, purpose-built for agent-based applications.","tools":["function_calling"],"status":"deprecated","deprecation_date":"2026-12-31"},{"id":"z-ai/glm-4.5v","name":"Z.ai: GLM 4.5V","created_by":"z-ai","source":"official","last_updated":"2026-03-24","description":"GLM-4.5V is a vision-language foundation model for multimodal agent applications.","context_window":65536,"max_output_tokens":16384,"modalities":{"input":["text","image"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":0.6,"output":1.8,"cached_input":0.11},"family":"glm-4.5","model_type":"chat","release_date":"2025-08-11","tagline":"GLM-4.5V is a vision-language foundation model for multimodal agent applications.","tools":["function_calling"]},{"id":"z-ai/glm-4.6","name":"Z.ai: GLM 
4.6","created_by":"z-ai","source":"official","last_updated":"2026-05-14","description":"Compared with GLM-4.5, this generation brings several key improvements: Longer context window: The context window has been expanded from 128K to 200K tokens, enabling the model to handle more complex.","context_window":202752,"max_output_tokens":131072,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":0.43,"output":1.74,"cached_input":0.08},"family":"glm-4.6","model_type":"chat","release_date":"2025-09-30","tagline":"Compared with GLM-4.5, this generation brings several key improvements:\n\nLonger context window: The context window has been expanded from 128K to 200K tokens, enabling the model to handle more complex","tools":["function_calling"],"status":"deprecated","deprecation_date":"2026-05-14"},{"id":"z-ai/glm-4.6v","name":"Z.ai: GLM 4.6V","created_by":"z-ai","source":"official","last_updated":"2026-06-10","description":"GLM-4.6V is a large multimodal model designed for high-fidelity visual understanding and long-context reasoning across images, documents, and mixed media.","context_window":131072,"max_output_tokens":32768,"modalities":{"input":["image","text","video"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":0.3,"output":0.9,"cached_input":0.055},"family":"glm-4.6","model_type":"chat","release_date":"2025-12-08","tagline":"GLM-4.6V is a large multimodal model designed for high-fidelity visual understanding and long-context reasoning across images, documents, and mixed media.","tools":["function_calling"]},{"id":"z-ai/glm-4.7-flash","name":"Z.ai: GLM 4.7 Flash","created_by":"z-ai","source":"official","last_updated":"2026-04-25","description":"As a 30B-class SOTA model, GLM-4.7-Flash offers a new option that balances performance and 
efficiency.","context_window":202752,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":0.06,"output":0.4,"cached_input":0.01},"family":"glm-4.7","model_type":"chat","release_date":"2026-01-19","tagline":"As a 30B-class SOTA model, GLM-4.7-Flash offers a new option that balances performance and efficiency.","tools":["function_calling"],"max_output_tokens":16384},{"id":"z-ai/glm-4.7","name":"Z.ai: GLM 4.7","created_by":"z-ai","source":"official","last_updated":"2026-05-10","description":"GLM-4.7 is Z.ai’s latest flagship model, featuring upgrades in two key areas: enhanced programming capabilities and more stable multi-step reasoning/execution.","context_window":202752,"max_output_tokens":131072,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":0.4,"output":1.75,"cached_input":0.08},"family":"glm-4.7","model_type":"chat","release_date":"2025-12-22","tagline":"GLM-4.7 is Z.ai’s latest flagship model, featuring upgrades in two key areas: enhanced programming capabilities and more stable multi-step reasoning/execution.","tools":["function_calling"]},{"id":"z-ai/glm-5-turbo","name":"Z.ai: GLM 5 Turbo","created_by":"z-ai","source":"official","last_updated":"2026-06-10","description":"GLM-5 Turbo is a new model from Z.ai designed for fast inference and strong performance in agent-driven environments such as OpenClaw scenarios.","context_window":262144,"max_output_tokens":131072,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":1.2,"output":4,"cached_input":0.24},"family":"glm-5","model_type":"chat","release_date":"2026-03-15","tagline":"GLM-5 Turbo is a new model from Z.ai designed for fast inference and strong performance in agent-driven 
environments such as OpenClaw scenarios.","tools":["function_calling"]},{"id":"z-ai/glm-5.1","name":"Z.ai: GLM 5.1","created_by":"z-ai","source":"official","family":"glm-5.1","description":"GLM-5.1 delivers a major leap in coding capability, with particularly significant gains in handling long-horizon tasks.","release_date":"2026-04-07","context_window":202752,"model_type":"chat","tagline":"GLM-5.1 delivers a major leap in coding capability, with particularly significant gains in handling long-horizon tasks.","capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.975,"output":4.3,"cached_input":0.182},"tools":["function_calling"],"last_updated":"2026-06-30","max_output_tokens":131072},{"id":"z-ai/glm-5.2","name":"Z.ai: GLM 5.2","created_by":"z-ai","source":"official","family":"glm-5.2","description":"GLM 5.2 is a large-scale reasoning model from Z.ai.","release_date":"2026-06-16","context_window":1048576,"max_output_tokens":32768,"model_type":"chat","tagline":"GLM 5.2 is a large-scale reasoning model from Z.ai.","capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.94,"output":3,"cached_input":0.18},"tools":["function_calling"],"last_updated":"2026-06-30"},{"id":"z-ai/glm-5","name":"Z.ai: GLM 5","created_by":"z-ai","source":"official","last_updated":"2026-06-03","description":"GLM-5 is Z.ai’s flagship open-source foundation model engineered for complex systems design and long-horizon agent workflows.","context_window":202752,"max_output_tokens":16384,"modalities":{"input":["text"],"output":["text"]},"capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"pricing":{"input":0.6,"output":1.92,"cached_input":0.12},"family":"glm-5","model_type":"chat","release_date":"2026-02-11","tagline":"GLM-5 is Z.ai’s flagship 
open-source foundation model engineered for complex systems design and long-horizon agent workflows.","tools":["function_calling"]},{"id":"z-ai/glm-5v-turbo","name":"Z.ai: GLM 5V Turbo","created_by":"z-ai","source":"official","family":"glm-5","description":"GLM-5V-Turbo is Z.ai’s first native multimodal agent foundation model, built for vision-based coding and agent-driven tasks.","release_date":"2026-04-01","context_window":202752,"max_output_tokens":131072,"model_type":"chat","tagline":"GLM-5V-Turbo is Z.ai’s first native multimodal agent foundation model, built for vision-based coding and agent-driven tasks.","capabilities":{"tool_call":true,"structured_output":true,"reasoning":true,"json_mode":true},"modalities":{"input":["image","text","video"],"output":["text"]},"pricing":{"input":1.2,"output":4,"cached_input":0.24},"tools":["function_calling"],"last_updated":"2026-06-29","status":"deprecated","deprecation_date":"2098-12-31"}]}; export const models: Model[] = provider.models.map((m) => ({ ...m, provider: provider.id })); diff --git a/packages/npm/src/providers/stability.ts b/packages/npm/src/providers/stability.ts index 0e3bcf321..ccc6befbd 100644 --- a/packages/npm/src/providers/stability.ts +++ b/packages/npm/src/providers/stability.ts @@ -3,6 +3,6 @@ import type { ProviderWithModels, Model } from '../types'; -export const provider: ProviderWithModels = {"id":"stability","name":"Stability AI","region":"GB","headquarters":"London, United Kingdom","founded":2019,"url":"https://stability.ai","api_url":"https://api.stability.ai","docs_url":"https://platform.stability.ai/docs","pricing_url":"https://platform.stability.ai/pricing","description":"AI company behind Stable Diffusion, Stable Video, Stable Audio, and related open and hosted generative models.","type":"direct","models_url":"https://huggingface.co/stabilityai","openai_compatible":false,"free_tier":false,"github_url":"https://github.com/Stability-AI","twitter_url":"https://x.com/StabilityAI","icon":"\n 
\n","models":[{"id":"ar-stablelm-2-base","name":"Ar Stablelm 2 Base","created_by":"stability","source":"official","description":"Ar Stablelm 2 Base is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2024-07-29","model_type":"chat","license":"other","page_url":"https://huggingface.co/stabilityai/ar-stablelm-2-base","open_weight":true,"tagline":"Ar Stablelm 2 Base is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["chat_completions"],"huggingface_downloads":2,"last_modified":"2024-12-06","last_updated":"2026-06-03"},{"id":"ar-stablelm-2-chat-gguf","name":"Ar Stablelm 2 Chat Gguf","created_by":"stability","source":"official","description":"Ar Stablelm 2 Chat Gguf is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2024-08-09","model_type":"other","license":"other","page_url":"https://huggingface.co/stabilityai/ar-stablelm-2-chat-gguf","open_weight":true,"tagline":"Ar Stablelm 2 Chat Gguf is a Stability AI model published on the official Stability AI Hugging Face organization.","huggingface_downloads":6,"last_modified":"2024-12-20","last_updated":"2026-06-03"},{"id":"ar-stablelm-2-chat","name":"Ar Stablelm 2 Chat","created_by":"stability","source":"official","description":"Ar Stablelm 2 Chat is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2024-08-06","model_type":"code","license":"other","page_url":"https://huggingface.co/stabilityai/ar-stablelm-2-chat","open_weight":true,"tagline":"Ar Stablelm 2 Chat is a Stability AI model published on the official Stability AI Hugging Face 
organization.","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["chat_completions"],"huggingface_downloads":7,"last_modified":"2024-12-06","last_updated":"2026-06-29"},{"id":"arcade100k","name":"Arcade100k","created_by":"stability","source":"official","description":"Arcade100k is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2023-10-27","model_type":"other","page_url":"https://huggingface.co/stabilityai/arcade100k","open_weight":true,"tagline":"Arcade100k is a Stability AI model published on the official Stability AI Hugging Face organization.","huggingface_downloads":0,"last_modified":"2024-04-12","last_updated":"2026-05-11"},{"id":"codellama13b_instruct_260k_synthesis","name":"Codellama13b Instruct 260k Synthesis","created_by":"stability","source":"official","family":"codellama","description":"Codellama13b Instruct 260k Synthesis is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2023-11-08","model_type":"chat","page_url":"https://huggingface.co/stabilityai/codellama13b_instruct_260k_synthesis","open_weight":true,"tagline":"Codellama13b Instruct 260k Synthesis is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"streaming":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["chat_completions"],"huggingface_downloads":38,"last_modified":"2023-11-08","last_updated":"2026-06-20"},{"id":"control-lora","name":"Control Lora","created_by":"stability","source":"official","description":"Control Lora is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2023-08-17","model_type":"image","license":"other","page_url":"https://huggingface.co/stabilityai/control-lora","open_weight":true,"tagline":"Control Lora is a Stability 
AI model published on the official Stability AI Hugging Face organization.","capabilities":{"vision":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"huggingface_downloads":0,"last_modified":"2023-08-19","last_updated":"2026-05-11"},{"id":"cosxl","name":"Cosxl","created_by":"stability","source":"official","description":"Cosxl is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2024-04-08","model_type":"image","license":"other","page_url":"https://huggingface.co/stabilityai/cosxl","open_weight":true,"tagline":"Cosxl is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"vision":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"huggingface_downloads":0,"last_modified":"2024-04-13","last_updated":"2026-05-11"},{"id":"japanese-instructblip-alpha","name":"Japanese Instructblip Alpha","created_by":"stability","source":"official","description":"Japanese Instructblip Alpha is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2023-08-15","model_type":"code","license":"other","page_url":"https://huggingface.co/stabilityai/japanese-instructblip-alpha","open_weight":true,"tagline":"Japanese Instructblip Alpha is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"vision":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text","image"],"output":["text"]},"endpoints":["chat_completions"],"huggingface_downloads":59,"last_modified":"2023-11-17","last_updated":"2026-06-29"},{"id":"japanese-stable-clip-vit-l-16","name":"Japanese Stable Clip Vit L 16","created_by":"stability","source":"official","description":"Japanese Stable Clip Vit L 16 is a Stability AI model published on the official Stability AI Hugging Face 
organization.","status":"active","release_date":"2023-11-01","model_type":"code","license":"other","page_url":"https://huggingface.co/stabilityai/japanese-stable-clip-vit-l-16","open_weight":true,"tagline":"Japanese Stable Clip Vit L 16 is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"streaming":true,"fine_tuning":true,"vision":true},"modalities":{"input":["text","image"],"output":["text"]},"endpoints":["chat_completions"],"huggingface_downloads":1660,"last_modified":"2024-07-10","last_updated":"2026-06-29"},{"id":"japanese-stable-diffusion-xl","name":"Japanese Stable Diffusion Xl","created_by":"stability","source":"official","description":"Japanese Stable Diffusion Xl is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2023-11-01","model_type":"image","license":"other","page_url":"https://huggingface.co/stabilityai/japanese-stable-diffusion-xl","open_weight":true,"tagline":"Japanese Stable Diffusion Xl is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"vision":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"huggingface_downloads":45,"last_modified":"2024-07-10","last_updated":"2026-06-29"},{"id":"japanese-stable-vlm","name":"Japanese Stable Vlm","created_by":"stability","source":"official","description":"Japanese Stable Vlm is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2023-11-01","model_type":"code","license":"other","page_url":"https://huggingface.co/stabilityai/japanese-stable-vlm","open_weight":true,"tagline":"Japanese Stable Vlm is a Stability AI model published on the official Stability AI Hugging Face 
organization.","capabilities":{"vision":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text","image"],"output":["text"]},"endpoints":["chat_completions"],"huggingface_downloads":13,"last_modified":"2024-07-10","last_updated":"2026-06-29"},{"id":"japanese-stablelm-2-base-1_6b","name":"Japanese Stablelm 2 Base 1 6b","created_by":"stability","source":"official","description":"Japanese Stablelm 2 Base 1 6b is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2024-05-02","model_type":"chat","license":"other","parameters":6,"page_url":"https://huggingface.co/stabilityai/japanese-stablelm-2-base-1_6b","open_weight":true,"tagline":"Japanese Stablelm 2 Base 1 6b is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["chat_completions"],"huggingface_downloads":3,"last_modified":"2024-05-02","last_updated":"2026-06-03"},{"id":"japanese-stablelm-2-instruct-1_6b","name":"Japanese Stablelm 2 Instruct 1 6b","created_by":"stability","source":"official","description":"Japanese Stablelm 2 Instruct 1 6b is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2024-05-02","model_type":"chat","license":"other","parameters":6,"page_url":"https://huggingface.co/stabilityai/japanese-stablelm-2-instruct-1_6b","open_weight":true,"tagline":"Japanese Stablelm 2 Instruct 1 6b is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["chat_completions"],"huggingface_downloads":68,"last_modified":"2024-07-10","last_updated":"2026-06-03"},{"id":"japanese-stablelm-3b-4e1t-base","name":"Japanese Stablelm 3b 4e1t 
Base","created_by":"stability","source":"official","description":"Japanese Stablelm 3b 4e1t Base is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2023-10-16","model_type":"chat","license":"apache-2.0","parameters":3,"page_url":"https://huggingface.co/stabilityai/japanese-stablelm-3b-4e1t-base","open_weight":true,"tagline":"Japanese Stablelm 3b 4e1t Base is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["chat_completions"],"huggingface_downloads":48,"last_modified":"2024-04-26","last_updated":"2026-06-29"},{"id":"japanese-stablelm-3b-4e1t-instruct","name":"Japanese Stablelm 3b 4e1t Instruct","created_by":"stability","source":"official","description":"Japanese Stablelm 3b 4e1t Instruct is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2023-10-16","model_type":"chat","license":"apache-2.0","parameters":3,"page_url":"https://huggingface.co/stabilityai/japanese-stablelm-3b-4e1t-instruct","open_weight":true,"tagline":"Japanese Stablelm 3b 4e1t Instruct is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["chat_completions"],"huggingface_downloads":148,"last_modified":"2024-04-26","last_updated":"2026-06-29"},{"id":"japanese-stablelm-base-alpha-7b","name":"Japanese Stablelm Base Alpha 7b","created_by":"stability","source":"official","description":"Japanese Stablelm Base Alpha 7b is a Stability AI model published on the official Stability AI Hugging Face 
organization.","status":"active","release_date":"2023-08-09","model_type":"chat","license":"apache-2.0","parameters":7,"page_url":"https://huggingface.co/stabilityai/japanese-stablelm-base-alpha-7b","open_weight":true,"tagline":"Japanese Stablelm Base Alpha 7b is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["chat_completions"],"huggingface_downloads":330,"last_modified":"2023-08-22","last_updated":"2026-06-29"},{"id":"japanese-stablelm-base-beta-70b","name":"Japanese Stablelm Base Beta 70b","created_by":"stability","source":"official","description":"Japanese Stablelm Base Beta 70b is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2023-10-30","model_type":"chat","license":"llama2","parameters":70,"page_url":"https://huggingface.co/stabilityai/japanese-stablelm-base-beta-70b","open_weight":true,"tagline":"Japanese Stablelm Base Beta 70b is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["chat_completions"],"huggingface_downloads":127,"last_modified":"2023-12-19","last_updated":"2026-06-29"},{"id":"japanese-stablelm-base-beta-7b","name":"Japanese Stablelm Base Beta 7b","created_by":"stability","source":"official","description":"Japanese Stablelm Base Beta 7b is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2023-10-30","model_type":"chat","license":"llama2","parameters":7,"page_url":"https://huggingface.co/stabilityai/japanese-stablelm-base-beta-7b","open_weight":true,"tagline":"Japanese Stablelm Base Beta 7b is a Stability AI model published on the official Stability AI Hugging Face 
organization.","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["chat_completions"],"huggingface_downloads":50,"last_modified":"2023-12-19","last_updated":"2026-06-29"},{"id":"japanese-stablelm-base-gamma-7b","name":"Japanese Stablelm Base Gamma 7b","created_by":"stability","source":"official","description":"Japanese Stablelm Base Gamma 7b is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2023-10-16","model_type":"chat","license":"apache-2.0","parameters":7,"page_url":"https://huggingface.co/stabilityai/japanese-stablelm-base-gamma-7b","open_weight":true,"tagline":"Japanese Stablelm Base Gamma 7b is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["chat_completions"],"huggingface_downloads":141,"last_modified":"2024-01-25","last_updated":"2026-06-29"},{"id":"japanese-stablelm-base-ja_vocab-beta-7b","name":"Japanese Stablelm Base Ja Vocab Beta 7b","created_by":"stability","source":"official","description":"Japanese Stablelm Base Ja Vocab Beta 7b is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2023-10-30","model_type":"chat","license":"llama2","parameters":7,"page_url":"https://huggingface.co/stabilityai/japanese-stablelm-base-ja_vocab-beta-7b","open_weight":true,"tagline":"Japanese Stablelm Base Ja Vocab Beta 7b is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["chat_completions"],"huggingface_downloads":40,"last_modified":"2023-12-19","last_updated":"2026-06-29"},{"id":"japanese-stablelm-instruct-alpha-7b-v2","name":"Japanese Stablelm Instruct 
Alpha 7b V2","created_by":"stability","source":"official","description":"Japanese Stablelm Instruct Alpha 7b V2 is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2023-09-26","model_type":"chat","license":"apache-2.0","parameters":7,"page_url":"https://huggingface.co/stabilityai/japanese-stablelm-instruct-alpha-7b-v2","open_weight":true,"tagline":"Japanese Stablelm Instruct Alpha 7b V2 is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["chat_completions"],"huggingface_downloads":40,"last_modified":"2023-10-06","last_updated":"2026-06-29"},{"id":"japanese-stablelm-instruct-alpha-7b","name":"Japanese Stablelm Instruct Alpha 7b","created_by":"stability","source":"official","description":"Japanese Stablelm Instruct Alpha 7b is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2023-08-10","model_type":"chat","license":"other","parameters":7,"page_url":"https://huggingface.co/stabilityai/japanese-stablelm-instruct-alpha-7b","open_weight":true,"tagline":"Japanese Stablelm Instruct Alpha 7b is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["chat_completions"],"huggingface_downloads":0,"last_modified":"2023-08-22","last_updated":"2026-05-11"},{"id":"japanese-stablelm-instruct-beta-70b","name":"Japanese Stablelm Instruct Beta 70b","created_by":"stability","source":"official","description":"Japanese Stablelm Instruct Beta 70b is a Stability AI model published on the official Stability AI Hugging Face 
organization.","status":"active","release_date":"2023-10-30","model_type":"chat","license":"llama2","parameters":70,"page_url":"https://huggingface.co/stabilityai/japanese-stablelm-instruct-beta-70b","open_weight":true,"tagline":"Japanese Stablelm Instruct Beta 70b is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["chat_completions"],"huggingface_downloads":131,"last_modified":"2023-12-19","last_updated":"2026-06-29"},{"id":"japanese-stablelm-instruct-beta-7b","name":"Japanese Stablelm Instruct Beta 7b","created_by":"stability","source":"official","description":"Japanese Stablelm Instruct Beta 7b is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2023-10-30","model_type":"chat","license":"llama2","parameters":7,"page_url":"https://huggingface.co/stabilityai/japanese-stablelm-instruct-beta-7b","open_weight":true,"tagline":"Japanese Stablelm Instruct Beta 7b is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["chat_completions"],"huggingface_downloads":58,"last_modified":"2023-12-19","last_updated":"2026-06-29"},{"id":"japanese-stablelm-instruct-gamma-7b","name":"Japanese Stablelm Instruct Gamma 7b","created_by":"stability","source":"official","description":"Japanese Stablelm Instruct Gamma 7b is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2023-10-16","model_type":"chat","license":"apache-2.0","parameters":7,"page_url":"https://huggingface.co/stabilityai/japanese-stablelm-instruct-gamma-7b","open_weight":true,"tagline":"Japanese Stablelm Instruct Gamma 7b is a Stability AI model published on the official 
Stability AI Hugging Face organization.","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["chat_completions"],"huggingface_downloads":151,"last_modified":"2024-01-24","last_updated":"2026-06-29"},{"id":"japanese-stablelm-instruct-ja_vocab-beta-7b","name":"Japanese Stablelm Instruct Ja Vocab Beta 7b","created_by":"stability","source":"official","description":"Japanese Stablelm Instruct Ja Vocab Beta 7b is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2023-10-30","model_type":"chat","license":"llama2","parameters":7,"page_url":"https://huggingface.co/stabilityai/japanese-stablelm-instruct-ja_vocab-beta-7b","open_weight":true,"tagline":"Japanese Stablelm Instruct Ja Vocab Beta 7b is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["chat_completions"],"huggingface_downloads":45,"last_modified":"2023-12-19","last_updated":"2026-06-29"},{"id":"SAME-L","name":"SAME L","created_by":"stability","source":"official","description":"SAME L is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2026-05-17","model_type":"code","license":"other","page_url":"https://huggingface.co/stabilityai/SAME-L","open_weight":true,"tagline":"SAME L is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["chat_completions"],"huggingface_downloads":6323,"last_modified":"2026-06-24","last_updated":"2026-06-29"},{"id":"SAME-S","name":"SAME S","created_by":"stability","source":"official","description":"SAME S is a Stability AI model published on the official Stability AI Hugging Face 
organization.","status":"active","release_date":"2026-05-17","model_type":"code","license":"other","page_url":"https://huggingface.co/stabilityai/SAME-S","open_weight":true,"tagline":"SAME S is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["chat_completions"],"huggingface_downloads":1549,"last_modified":"2026-05-19","last_updated":"2026-06-29"},{"id":"sd-turbo","name":"Sd Turbo","created_by":"stability","source":"official","description":"Sd Turbo is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2023-11-27","model_type":"image","page_url":"https://huggingface.co/stabilityai/sd-turbo","open_weight":true,"tagline":"Sd Turbo is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"huggingface_downloads":698263,"last_modified":"2024-07-10","last_updated":"2026-06-29"},{"id":"sd-vae-ft-ema-original","name":"Sd Vae Ft Ema Original","created_by":"stability","source":"official","description":"Sd Vae Ft Ema Original is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2022-10-13","model_type":"image","license":"mit","page_url":"https://huggingface.co/stabilityai/sd-vae-ft-ema-original","open_weight":true,"tagline":"Sd Vae Ft Ema Original is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"vision":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"huggingface_downloads":0,"last_modified":"2022-12-19","last_updated":"2026-05-11"},{"id":"sd-vae-ft-ema","name":"Sd Vae Ft Ema","created_by":"stability","source":"official","description":"Sd 
Vae Ft Ema is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2022-10-13","model_type":"other","license":"mit","page_url":"https://huggingface.co/stabilityai/sd-vae-ft-ema","open_weight":true,"tagline":"Sd Vae Ft Ema is a Stability AI model published on the official Stability AI Hugging Face organization.","huggingface_downloads":7037,"last_modified":"2023-06-05","last_updated":"2026-06-29"},{"id":"sd-vae-ft-mse-original","name":"Sd Vae Ft Mse Original","created_by":"stability","source":"official","description":"Sd Vae Ft Mse Original is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2022-10-13","model_type":"image","license":"mit","page_url":"https://huggingface.co/stabilityai/sd-vae-ft-mse-original","open_weight":true,"tagline":"Sd Vae Ft Mse Original is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"vision":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"huggingface_downloads":1,"last_modified":"2022-12-19","last_updated":"2026-06-29"},{"id":"sd-vae-ft-mse","name":"Sd Vae Ft Mse","created_by":"stability","source":"official","description":"Sd Vae Ft Mse is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2022-10-13","model_type":"other","license":"mit","page_url":"https://huggingface.co/stabilityai/sd-vae-ft-mse","open_weight":true,"tagline":"Sd Vae Ft Mse is a Stability AI model published on the official Stability AI Hugging Face organization.","huggingface_downloads":102468,"last_modified":"2023-06-06","last_updated":"2026-06-29"},{"id":"sd-x2-latent-upscaler","name":"Sd X2 Latent Upscaler","created_by":"stability","source":"official","description":"Sd X2 Latent Upscaler is a Stability AI model published on the official Stability AI 
Hugging Face organization.","status":"active","release_date":"2023-02-03","model_type":"other","license":"openrail++","page_url":"https://huggingface.co/stabilityai/sd-x2-latent-upscaler","open_weight":true,"tagline":"Sd X2 Latent Upscaler is a Stability AI model published on the official Stability AI Hugging Face organization.","huggingface_downloads":130271,"last_modified":"2023-06-05","last_updated":"2026-06-29"},{"id":"sdxl-turbo-ryzen-ai","name":"Sdxl Turbo Ryzen Ai","created_by":"stability","source":"official","description":"Sdxl Turbo Ryzen Ai is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2024-12-06","model_type":"image","license":"other","page_url":"https://huggingface.co/stabilityai/sdxl-turbo-ryzen-ai","open_weight":true,"tagline":"Sdxl Turbo Ryzen Ai is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"vision":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"huggingface_downloads":489,"last_modified":"2024-12-11","last_updated":"2026-06-29"},{"id":"sdxl-turbo-tensorrt","name":"Sdxl Turbo Tensorrt","created_by":"stability","source":"official","description":"Sdxl Turbo Tensorrt is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2023-12-28","model_type":"image","license":"other","page_url":"https://huggingface.co/stabilityai/sdxl-turbo-tensorrt","open_weight":true,"tagline":"Sdxl Turbo Tensorrt is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"vision":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"huggingface_downloads":29,"last_modified":"2025-10-20","last_updated":"2026-06-29"},{"id":"sdxl-turbo","name":"Sdxl Turbo","created_by":"stability","source":"official","description":"Sdxl Turbo is a 
Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2023-11-27","model_type":"image","license":"other","page_url":"https://huggingface.co/stabilityai/sdxl-turbo","open_weight":true,"tagline":"Sdxl Turbo is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"vision":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"huggingface_downloads":609582,"last_modified":"2024-07-10","last_updated":"2026-06-29"},{"id":"sdxl-vae","name":"Sdxl Vae","created_by":"stability","source":"official","description":"Sdxl Vae is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2023-06-21","model_type":"other","license":"mit","page_url":"https://huggingface.co/stabilityai/sdxl-vae","open_weight":true,"tagline":"Sdxl Vae is a Stability AI model published on the official Stability AI Hugging Face organization.","huggingface_downloads":263433,"last_modified":"2023-08-04","last_updated":"2026-06-29"},{"id":"sp4d","name":"Sp4d","created_by":"stability","source":"official","description":"Sp4d is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2025-11-03","model_type":"other","license":"other","page_url":"https://huggingface.co/stabilityai/sp4d","open_weight":true,"tagline":"Sp4d is a Stability AI model published on the official Stability AI Hugging Face organization.","huggingface_downloads":15,"last_modified":"2025-11-05","last_updated":"2026-06-29"},{"id":"stable-audio-3-medium-base","name":"Stable Audio 3 Medium Base","created_by":"stability","source":"official","description":"Stable Audio 3 Medium Base is a Stability AI model published on the official Stability AI Hugging Face 
organization.","status":"active","release_date":"2026-05-17","model_type":"audio","license":"other","page_url":"https://huggingface.co/stabilityai/stable-audio-3-medium-base","open_weight":true,"tagline":"Stable Audio 3 Medium Base is a Stability AI model published on the official Stability AI Hugging Face organization.","huggingface_downloads":4312,"last_modified":"2026-06-16","last_updated":"2026-06-29"},{"id":"stable-audio-3-medium","name":"Stable Audio 3 Medium","created_by":"stability","source":"official","description":"Stable Audio 3 Medium is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2026-05-17","model_type":"audio","license":"other","page_url":"https://huggingface.co/stabilityai/stable-audio-3-medium","open_weight":true,"tagline":"Stable Audio 3 Medium is a Stability AI model published on the official Stability AI Hugging Face organization.","huggingface_downloads":59946,"last_modified":"2026-06-16","last_updated":"2026-06-29"},{"id":"stable-audio-3-small-music-base","name":"Stable Audio 3 Small Music Base","created_by":"stability","source":"official","description":"Stable Audio 3 Small Music Base is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2026-05-16","model_type":"audio","license":"other","page_url":"https://huggingface.co/stabilityai/stable-audio-3-small-music-base","open_weight":true,"tagline":"Stable Audio 3 Small Music Base is a Stability AI model published on the official Stability AI Hugging Face organization.","huggingface_downloads":1769,"last_modified":"2026-05-20","last_updated":"2026-06-29"},{"id":"stable-audio-3-small-music","name":"Stable Audio 3 Small Music","created_by":"stability","source":"official","description":"Stable Audio 3 Small Music is a Stability AI model published on the official Stability AI Hugging Face 
organization.","status":"active","release_date":"2026-05-17","model_type":"audio","license":"other","page_url":"https://huggingface.co/stabilityai/stable-audio-3-small-music","open_weight":true,"tagline":"Stable Audio 3 Small Music is a Stability AI model published on the official Stability AI Hugging Face organization.","huggingface_downloads":15603,"last_modified":"2026-05-19","last_updated":"2026-06-29"},{"id":"stable-audio-3-small-sfx-base","name":"Stable Audio 3 Small Sfx Base","created_by":"stability","source":"official","description":"Stable Audio 3 Small Sfx Base is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2026-05-17","model_type":"audio","license":"other","page_url":"https://huggingface.co/stabilityai/stable-audio-3-small-sfx-base","open_weight":true,"tagline":"Stable Audio 3 Small Sfx Base is a Stability AI model published on the official Stability AI Hugging Face organization.","huggingface_downloads":1054,"last_modified":"2026-05-20","last_updated":"2026-06-29"},{"id":"stable-audio-3-small-sfx","name":"Stable Audio 3 Small Sfx","created_by":"stability","source":"official","description":"Stable Audio 3 Small Sfx is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2026-05-17","model_type":"audio","license":"other","page_url":"https://huggingface.co/stabilityai/stable-audio-3-small-sfx","open_weight":true,"tagline":"Stable Audio 3 Small Sfx is a Stability AI model published on the official Stability AI Hugging Face organization.","huggingface_downloads":12006,"last_modified":"2026-05-19","last_updated":"2026-06-29"},{"id":"stable-audio-open-1.0","name":"Stable Audio Open 1.0","created_by":"stability","source":"official","description":"Stable Audio Open 1.0 is a Stability AI model published on the official Stability AI Hugging Face 
organization.","status":"active","release_date":"2024-05-24","model_type":"audio","license":"other","page_url":"https://huggingface.co/stabilityai/stable-audio-open-1.0","open_weight":true,"tagline":"Stable Audio Open 1.0 is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"tool_call":true,"fine_tuning":true},"tools":["function_calling"],"huggingface_downloads":26532,"last_modified":"2025-06-19","last_updated":"2026-06-29"},{"id":"stable-audio-open-small","name":"Stable Audio Open Small","created_by":"stability","source":"official","description":"Stable Audio Open Small is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2025-05-12","model_type":"audio","license":"other","page_url":"https://huggingface.co/stabilityai/stable-audio-open-small","open_weight":true,"tagline":"Stable Audio Open Small is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"tool_call":true,"fine_tuning":true},"tools":["function_calling"],"huggingface_downloads":2235,"last_modified":"2025-05-27","last_updated":"2026-06-29"},{"id":"stable-cascade-prior","name":"Stable Cascade Prior","created_by":"stability","source":"official","description":"Stable Cascade Prior is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2024-02-12","model_type":"image","license":"other","page_url":"https://huggingface.co/stabilityai/stable-cascade-prior","open_weight":true,"tagline":"Stable Cascade Prior is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"vision":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"huggingface_downloads":789,"last_modified":"2024-03-14","last_updated":"2026-06-29"},{"id":"stable-cascade","name":"Stable 
Cascade","created_by":"stability","source":"official","description":"Stable Cascade is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2024-02-06","model_type":"image","license":"other","page_url":"https://huggingface.co/stabilityai/stable-cascade","open_weight":true,"tagline":"Stable Cascade is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"vision":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"huggingface_downloads":8252,"last_modified":"2024-03-16","last_updated":"2026-06-29"},{"id":"stable-code-3b","name":"Stable Code 3b","created_by":"stability","source":"official","description":"Stable Code 3b is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2024-01-09","model_type":"chat","license":"other","parameters":3,"page_url":"https://huggingface.co/stabilityai/stable-code-3b","open_weight":true,"tagline":"Stable Code 3b is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["chat_completions"],"huggingface_downloads":5918,"last_modified":"2024-07-10","last_updated":"2026-06-29"},{"id":"stable-code-instruct-3b","name":"Stable Code Instruct 3b","created_by":"stability","source":"official","description":"Stable Code Instruct 3b is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2024-03-06","model_type":"chat","license":"other","parameters":3,"page_url":"https://huggingface.co/stabilityai/stable-code-instruct-3b","open_weight":true,"tagline":"Stable Code Instruct 3b is a Stability AI model published on the official Stability AI Hugging Face 
organization.","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["chat_completions"],"huggingface_downloads":2335,"last_modified":"2024-07-10","last_updated":"2026-06-29"},{"id":"stable-codec-speech-16k-base","name":"Stable Codec Speech 16k Base","created_by":"stability","source":"official","description":"Stable Codec Speech 16k Base is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2025-01-14","model_type":"other","license":"other","page_url":"https://huggingface.co/stabilityai/stable-codec-speech-16k-base","open_weight":true,"tagline":"Stable Codec Speech 16k Base is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"tool_call":true,"fine_tuning":true},"tools":["function_calling"],"huggingface_downloads":1,"last_modified":"2025-01-14","last_updated":"2026-06-03"},{"id":"stable-codec-speech-16k","name":"Stable Codec Speech 16k","created_by":"stability","source":"official","description":"Stable Codec Speech 16k is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2025-01-10","model_type":"other","license":"other","page_url":"https://huggingface.co/stabilityai/stable-codec-speech-16k","open_weight":true,"tagline":"Stable Codec Speech 16k is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"tool_call":true,"fine_tuning":true},"tools":["function_calling"],"huggingface_downloads":334,"last_modified":"2025-01-10","last_updated":"2026-06-29"},{"id":"stable-diffusion-3-medium-amdnpu","name":"Stable Diffusion 3 Medium Amdnpu","created_by":"stability","source":"official","description":"Stable Diffusion 3 Medium Amdnpu is a Stability AI model published on the official Stability AI Hugging Face 
organization.","status":"active","release_date":"2026-05-01","model_type":"image","license":"other","page_url":"https://huggingface.co/stabilityai/stable-diffusion-3-medium-amdnpu","open_weight":true,"tagline":"Stable Diffusion 3 Medium Amdnpu is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"vision":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"huggingface_downloads":27,"last_modified":"2026-05-05","last_updated":"2026-06-29"},{"id":"stable-diffusion-3-medium-diffusers","name":"Stable Diffusion 3 Medium Diffusers","created_by":"stability","source":"official","description":"Stable Diffusion 3 Medium Diffusers is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2024-06-12","model_type":"image","license":"other","page_url":"https://huggingface.co/stabilityai/stable-diffusion-3-medium-diffusers","open_weight":true,"tagline":"Stable Diffusion 3 Medium Diffusers is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"vision":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"huggingface_downloads":33289,"last_modified":"2024-06-19","last_updated":"2026-06-29"},{"id":"stable-diffusion-3-medium-tensorrt","name":"Stable Diffusion 3 Medium Tensorrt","created_by":"stability","source":"official","description":"Stable Diffusion 3 Medium Tensorrt is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2024-06-12","model_type":"image","license":"other","page_url":"https://huggingface.co/stabilityai/stable-diffusion-3-medium-tensorrt","open_weight":true,"tagline":"Stable Diffusion 3 Medium Tensorrt is a Stability AI model published on the official Stability AI Hugging Face 
organization.","capabilities":{"vision":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"huggingface_downloads":15,"last_modified":"2025-10-20","last_updated":"2026-06-29"},{"id":"stable-diffusion-3-medium","name":"Stable Diffusion 3 Medium","created_by":"stability","source":"official","description":"Stable Diffusion 3 Medium is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2024-05-30","model_type":"image","license":"other","page_url":"https://huggingface.co/stabilityai/stable-diffusion-3-medium","open_weight":true,"tagline":"Stable Diffusion 3 Medium is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"vision":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"huggingface_downloads":3481,"last_modified":"2024-08-12","last_updated":"2026-06-29"},{"id":"stable-diffusion-3-medium_amdgpu","name":"Stable Diffusion 3 Medium Amdgpu","created_by":"stability","source":"official","description":"Stable Diffusion 3 Medium Amdgpu is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2025-02-28","model_type":"image","license":"other","page_url":"https://huggingface.co/stabilityai/stable-diffusion-3-medium_amdgpu","open_weight":true,"tagline":"Stable Diffusion 3 Medium Amdgpu is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"vision":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"huggingface_downloads":0,"last_modified":"2025-07-16","last_updated":"2026-05-11"},{"id":"stable-diffusion-3.5-controlnets-tensorrt","name":"Stable Diffusion 3.5 Controlnets Tensorrt","created_by":"stability","source":"official","description":"Stable Diffusion 3.5 Controlnets Tensorrt is a Stability 
AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2025-08-07","model_type":"image","license":"other","page_url":"https://huggingface.co/stabilityai/stable-diffusion-3.5-controlnets-tensorrt","open_weight":true,"tagline":"Stable Diffusion 3.5 Controlnets Tensorrt is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"vision":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"huggingface_downloads":177,"last_modified":"2025-10-20","last_updated":"2026-06-29"},{"id":"stable-diffusion-3.5-controlnets","name":"Stable Diffusion 3.5 Controlnets","created_by":"stability","source":"official","description":"Stable Diffusion 3.5 Controlnets is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2024-11-15","model_type":"image","license":"other","page_url":"https://huggingface.co/stabilityai/stable-diffusion-3.5-controlnets","open_weight":true,"tagline":"Stable Diffusion 3.5 Controlnets is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"vision":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"huggingface_downloads":12,"last_modified":"2024-12-11","last_updated":"2026-06-29"},{"id":"stable-diffusion-3.5-large-controlnet-blur","name":"Stable Diffusion 3.5 Large Controlnet Blur","created_by":"stability","source":"official","description":"Stable Diffusion 3.5 Large Controlnet Blur is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2024-11-25","model_type":"image","license":"other","page_url":"https://huggingface.co/stabilityai/stable-diffusion-3.5-large-controlnet-blur","open_weight":true,"tagline":"Stable Diffusion 3.5 Large Controlnet Blur is a Stability AI model published 
on the official Stability AI Hugging Face organization.","capabilities":{"vision":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"huggingface_downloads":53,"last_modified":"2024-11-28","last_updated":"2026-06-29"},{"id":"stable-diffusion-3.5-large-controlnet-canny","name":"Stable Diffusion 3.5 Large Controlnet Canny","created_by":"stability","source":"official","description":"Stable Diffusion 3.5 Large Controlnet Canny is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2024-11-25","model_type":"image","license":"other","page_url":"https://huggingface.co/stabilityai/stable-diffusion-3.5-large-controlnet-canny","open_weight":true,"tagline":"Stable Diffusion 3.5 Large Controlnet Canny is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"vision":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"huggingface_downloads":21152,"last_modified":"2024-11-28","last_updated":"2026-06-29"},{"id":"stable-diffusion-3.5-large-controlnet-depth","name":"Stable Diffusion 3.5 Large Controlnet Depth","created_by":"stability","source":"official","description":"Stable Diffusion 3.5 Large Controlnet Depth is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2024-11-25","model_type":"image","license":"other","page_url":"https://huggingface.co/stabilityai/stable-diffusion-3.5-large-controlnet-depth","open_weight":true,"tagline":"Stable Diffusion 3.5 Large Controlnet Depth is a Stability AI model published on the official Stability AI Hugging Face 
organization.","capabilities":{"vision":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"huggingface_downloads":24549,"last_modified":"2024-11-28","last_updated":"2026-06-29"},{"id":"stable-diffusion-3.5-large-tensorrt","name":"Stable Diffusion 3.5 Large Tensorrt","created_by":"stability","source":"official","description":"Stable Diffusion 3.5 Large Tensorrt is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2025-05-16","model_type":"image","license":"other","page_url":"https://huggingface.co/stabilityai/stable-diffusion-3.5-large-tensorrt","open_weight":true,"tagline":"Stable Diffusion 3.5 Large Tensorrt is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"vision":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"huggingface_downloads":1469,"last_modified":"2025-10-20","last_updated":"2026-06-29"},{"id":"stable-diffusion-3.5-large-turbo","name":"Stable Diffusion 3.5 Large Turbo","created_by":"stability","source":"official","description":"Stable Diffusion 3.5 Large Turbo is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2024-10-22","model_type":"image","license":"other","page_url":"https://huggingface.co/stabilityai/stable-diffusion-3.5-large-turbo","open_weight":true,"tagline":"Stable Diffusion 3.5 Large Turbo is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"vision":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"huggingface_downloads":6991,"last_modified":"2024-10-22","last_updated":"2026-06-29"},{"id":"stable-diffusion-3.5-large","name":"Stable Diffusion 3.5 Large","created_by":"stability","source":"official","description":"Stable Diffusion 3.5 Large is 
a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2024-10-22","model_type":"image","license":"other","page_url":"https://huggingface.co/stabilityai/stable-diffusion-3.5-large","open_weight":true,"tagline":"Stable Diffusion 3.5 Large is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"vision":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"huggingface_downloads":26298,"last_modified":"2024-10-22","last_updated":"2026-06-29"},{"id":"stable-diffusion-3.5-medium-tensorrt","name":"Stable Diffusion 3.5 Medium Tensorrt","created_by":"stability","source":"official","description":"Stable Diffusion 3.5 Medium Tensorrt is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2025-08-07","model_type":"image","license":"other","page_url":"https://huggingface.co/stabilityai/stable-diffusion-3.5-medium-tensorrt","open_weight":true,"tagline":"Stable Diffusion 3.5 Medium Tensorrt is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"vision":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"huggingface_downloads":9,"last_modified":"2025-10-20","last_updated":"2026-06-29"},{"id":"stable-diffusion-3.5-medium","name":"Stable Diffusion 3.5 Medium","created_by":"stability","source":"official","description":"Stable Diffusion 3.5 Medium is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2024-10-29","model_type":"image","license":"other","page_url":"https://huggingface.co/stabilityai/stable-diffusion-3.5-medium","open_weight":true,"tagline":"Stable Diffusion 3.5 Medium is a Stability AI model published on the official Stability AI Hugging Face 
organization.","capabilities":{"vision":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"huggingface_downloads":612474,"last_modified":"2024-10-31","last_updated":"2026-06-29"},{"id":"stable-diffusion-x4-upscaler","name":"Stable Diffusion X4 Upscaler","created_by":"stability","source":"official","description":"Stable Diffusion X4 Upscaler is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2022-11-23","model_type":"other","license":"openrail++","page_url":"https://huggingface.co/stabilityai/stable-diffusion-x4-upscaler","open_weight":true,"tagline":"Stable Diffusion X4 Upscaler is a Stability AI model published on the official Stability AI Hugging Face organization.","huggingface_downloads":10328,"last_modified":"2023-07-05","last_updated":"2026-06-29"},{"id":"stable-diffusion-xl-1.0-tensorrt","name":"Stable Diffusion Xl 1.0 Tensorrt","created_by":"stability","source":"official","description":"Stable Diffusion Xl 1.0 Tensorrt is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2023-08-22","model_type":"image","license":"openrail++","page_url":"https://huggingface.co/stabilityai/stable-diffusion-xl-1.0-tensorrt","open_weight":true,"tagline":"Stable Diffusion Xl 1.0 Tensorrt is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"vision":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"huggingface_downloads":275,"last_modified":"2025-10-20","last_updated":"2026-06-29"},{"id":"stable-diffusion-xl-base-0.9","name":"Stable Diffusion Xl Base 0.9","created_by":"stability","source":"official","description":"Stable Diffusion Xl Base 0.9 is a Stability AI model published on the official Stability AI Hugging Face 
organization.","status":"active","release_date":"2023-06-19","model_type":"image","license":"other","page_url":"https://huggingface.co/stabilityai/stable-diffusion-xl-base-0.9","open_weight":true,"tagline":"Stable Diffusion Xl Base 0.9 is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"vision":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"huggingface_downloads":48,"last_modified":"2023-07-12","last_updated":"2026-06-29"},{"id":"stable-diffusion-xl-base-1.0","name":"Stable Diffusion Xl Base 1.0","created_by":"stability","source":"official","description":"Stable Diffusion Xl Base 1.0 is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2023-07-25","model_type":"image","license":"openrail++","page_url":"https://huggingface.co/stabilityai/stable-diffusion-xl-base-1.0","open_weight":true,"tagline":"Stable Diffusion Xl Base 1.0 is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"vision":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"huggingface_downloads":1324082,"last_modified":"2023-10-30","last_updated":"2026-06-29"},{"id":"stable-diffusion-xl-refiner-0.9","name":"Stable Diffusion Xl Refiner 0.9","created_by":"stability","source":"official","description":"Stable Diffusion Xl Refiner 0.9 is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2023-06-21","model_type":"image","license":"other","page_url":"https://huggingface.co/stabilityai/stable-diffusion-xl-refiner-0.9","open_weight":true,"tagline":"Stable Diffusion Xl Refiner 0.9 is a Stability AI model published on the official Stability AI Hugging Face 
organization.","capabilities":{"vision":true,"fine_tuning":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"huggingface_downloads":45,"last_modified":"2023-07-12","last_updated":"2026-06-29"},{"id":"stable-diffusion-xl-refiner-1.0","name":"Stable Diffusion Xl Refiner 1.0","created_by":"stability","source":"official","description":"Stable Diffusion Xl Refiner 1.0 is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2023-07-26","model_type":"image","license":"openrail++","page_url":"https://huggingface.co/stabilityai/stable-diffusion-xl-refiner-1.0","open_weight":true,"tagline":"Stable Diffusion Xl Refiner 1.0 is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"vision":true,"fine_tuning":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"huggingface_downloads":163793,"last_modified":"2023-09-25","last_updated":"2026-06-29"},{"id":"stable-fast-3d","name":"Stable Fast 3d","created_by":"stability","source":"official","description":"Stable Fast 3d is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2024-07-17","model_type":"other","license":"other","page_url":"https://huggingface.co/stabilityai/stable-fast-3d","open_weight":true,"tagline":"Stable Fast 3d is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"vision":true,"fine_tuning":true},"huggingface_downloads":11960,"last_modified":"2025-04-08","last_updated":"2026-06-29"},{"id":"stable-point-aware-3d","name":"Stable Point Aware 3d","created_by":"stability","source":"official","description":"Stable Point Aware 3d is a Stability AI model published on the official Stability AI Hugging Face 
organization.","status":"active","release_date":"2024-12-28","model_type":"other","license":"other","page_url":"https://huggingface.co/stabilityai/stable-point-aware-3d","open_weight":true,"tagline":"Stable Point Aware 3d is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"vision":true,"fine_tuning":true},"huggingface_downloads":2132,"last_modified":"2025-04-08","last_updated":"2026-06-29"},{"id":"stable-video-diffusion-img2vid-xt-1-1-tensorrt","name":"Stable Video Diffusion Img2vid Xt 1 1 Tensorrt","created_by":"stability","source":"official","description":"Stable Video Diffusion Img2vid Xt 1 1 Tensorrt is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2024-03-07","model_type":"video","license":"other","page_url":"https://huggingface.co/stabilityai/stable-video-diffusion-img2vid-xt-1-1-tensorrt","open_weight":true,"tagline":"Stable Video Diffusion Img2vid Xt 1 1 Tensorrt is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"vision":true,"fine_tuning":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"huggingface_downloads":20,"last_modified":"2025-10-20","last_updated":"2026-06-29"},{"id":"stable-video-diffusion-img2vid-xt-1-1","name":"Stable Video Diffusion Img2vid Xt 1 1","created_by":"stability","source":"official","description":"Stable Video Diffusion Img2vid Xt 1 1 is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2024-02-02","model_type":"video","license":"other","page_url":"https://huggingface.co/stabilityai/stable-video-diffusion-img2vid-xt-1-1","open_weight":true,"tagline":"Stable Video Diffusion Img2vid Xt 1 1 is a Stability AI model published on the official Stability AI Hugging Face 
organization.","capabilities":{"vision":true,"fine_tuning":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"huggingface_downloads":7772,"last_modified":"2024-07-10","last_updated":"2026-06-29"},{"id":"stable-video-diffusion-img2vid-xt","name":"Stable Video Diffusion Img2vid Xt","created_by":"stability","source":"official","description":"Stable Video Diffusion Img2vid Xt is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2023-11-20","model_type":"video","license":"other","page_url":"https://huggingface.co/stabilityai/stable-video-diffusion-img2vid-xt","open_weight":true,"tagline":"Stable Video Diffusion Img2vid Xt is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"vision":true,"fine_tuning":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"huggingface_downloads":218304,"last_modified":"2024-07-10","last_updated":"2026-06-29"},{"id":"stable-video-diffusion-img2vid","name":"Stable Video Diffusion Img2vid","created_by":"stability","source":"official","description":"Stable Video Diffusion Img2vid is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2023-11-20","model_type":"video","license":"other","page_url":"https://huggingface.co/stabilityai/stable-video-diffusion-img2vid","open_weight":true,"tagline":"Stable Video Diffusion Img2vid is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"vision":true,"fine_tuning":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"huggingface_downloads":32007,"last_modified":"2024-07-10","last_updated":"2026-06-29"},{"id":"stable-virtual-camera","name":"Stable Virtual Camera","created_by":"stability","source":"official","description":"Stable Virtual Camera is a Stability 
AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2025-02-19","model_type":"video","license":"other","page_url":"https://huggingface.co/stabilityai/stable-virtual-camera","open_weight":true,"tagline":"Stable Virtual Camera is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"vision":true,"fine_tuning":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"huggingface_downloads":9634,"last_modified":"2025-06-03","last_updated":"2026-06-29"},{"id":"stable-zero123","name":"Stable Zero123","created_by":"stability","source":"official","description":"Stable Zero123 is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2023-12-08","model_type":"other","license":"other","page_url":"https://huggingface.co/stabilityai/stable-zero123","open_weight":true,"tagline":"Stable Zero123 is a Stability AI model published on the official Stability AI Hugging Face organization.","huggingface_downloads":0,"last_modified":"2024-07-10","last_updated":"2026-05-11"},{"id":"StableBeluga-13B","name":"StableBeluga 13B","created_by":"stability","source":"official","description":"StableBeluga 13B is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2023-07-27","model_type":"chat","parameters":13,"page_url":"https://huggingface.co/stabilityai/StableBeluga-13B","open_weight":true,"tagline":"StableBeluga 13B is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"streaming":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["chat_completions"],"huggingface_downloads":260,"last_modified":"2023-08-29","last_updated":"2026-06-29"},{"id":"StableBeluga-7B","name":"StableBeluga 
7B","created_by":"stability","source":"official","description":"StableBeluga 7B is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2023-07-27","model_type":"chat","parameters":7,"page_url":"https://huggingface.co/stabilityai/StableBeluga-7B","open_weight":true,"tagline":"StableBeluga 7B is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"streaming":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["chat_completions"],"huggingface_downloads":251,"last_modified":"2023-08-29","last_updated":"2026-06-29"},{"id":"StableBeluga1-Delta","name":"StableBeluga1 Delta","created_by":"stability","source":"official","description":"StableBeluga1 Delta is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2023-07-20","model_type":"chat","license":"cc-by-nc-4.0","page_url":"https://huggingface.co/stabilityai/StableBeluga1-Delta","open_weight":true,"tagline":"StableBeluga1 Delta is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["chat_completions"],"huggingface_downloads":145,"last_modified":"2023-07-27","last_updated":"2026-06-29"},{"id":"StableBeluga2","name":"StableBeluga2","created_by":"stability","source":"official","description":"StableBeluga2 is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2023-07-20","model_type":"chat","page_url":"https://huggingface.co/stabilityai/StableBeluga2","open_weight":true,"tagline":"StableBeluga2 is a Stability AI model published on the official Stability AI Hugging Face 
organization.","capabilities":{"streaming":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["chat_completions"],"huggingface_downloads":717,"last_modified":"2023-09-18","last_updated":"2026-06-29"},{"id":"stablecode-completion-alpha-3b-4k","name":"Stablecode Completion Alpha 3b 4k","created_by":"stability","source":"official","description":"Stablecode Completion Alpha 3b 4k is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2023-08-07","model_type":"chat","license":"apache-2.0","parameters":3,"page_url":"https://huggingface.co/stabilityai/stablecode-completion-alpha-3b-4k","open_weight":true,"tagline":"Stablecode Completion Alpha 3b 4k is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["chat_completions"],"huggingface_downloads":1115,"last_modified":"2023-08-08","last_updated":"2026-06-29"},{"id":"stablecode-completion-alpha-3b","name":"Stablecode Completion Alpha 3b","created_by":"stability","source":"official","description":"Stablecode Completion Alpha 3b is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2023-07-31","model_type":"chat","license":"apache-2.0","parameters":3,"page_url":"https://huggingface.co/stabilityai/stablecode-completion-alpha-3b","open_weight":true,"tagline":"Stablecode Completion Alpha 3b is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["chat_completions"],"huggingface_downloads":408,"last_modified":"2023-08-08","last_updated":"2026-06-29"},{"id":"stablecode-instruct-alpha-3b","name":"Stablecode Instruct Alpha 
3b","created_by":"stability","source":"official","description":"Stablecode Instruct Alpha 3b is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2023-08-07","model_type":"chat","license":"other","parameters":3,"page_url":"https://huggingface.co/stabilityai/stablecode-instruct-alpha-3b","open_weight":true,"tagline":"Stablecode Instruct Alpha 3b is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["chat_completions"],"huggingface_downloads":4,"last_modified":"2023-08-08","last_updated":"2026-06-29"},{"id":"stablelm-2-12b-chat-GGUF","name":"Stablelm 2 12b Chat GGUF","created_by":"stability","source":"official","description":"Stablelm 2 12b Chat GGUF is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2024-04-17","model_type":"chat","license":"other","parameters":12,"page_url":"https://huggingface.co/stabilityai/stablelm-2-12b-chat-GGUF","open_weight":true,"tagline":"Stablelm 2 12b Chat GGUF is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"tool_call":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["chat_completions"],"tools":["function_calling"],"huggingface_downloads":168,"last_modified":"2024-04-20","last_updated":"2026-06-29"},{"id":"stablelm-2-12b-chat","name":"Stablelm 2 12b Chat","created_by":"stability","source":"official","description":"Stablelm 2 12b Chat is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2024-04-04","model_type":"chat","license":"other","parameters":12,"page_url":"https://huggingface.co/stabilityai/stablelm-2-12b-chat","open_weight":true,"tagline":"Stablelm 2 
12b Chat is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"tool_call":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["chat_completions"],"tools":["function_calling"],"huggingface_downloads":266,"last_modified":"2024-05-20","last_updated":"2026-06-29"},{"id":"stablelm-2-12b","name":"Stablelm 2 12b","created_by":"stability","source":"official","description":"Stablelm 2 12b is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2024-03-21","model_type":"chat","license":"other","parameters":12,"page_url":"https://huggingface.co/stabilityai/stablelm-2-12b","open_weight":true,"tagline":"Stablelm 2 12b is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["chat_completions"],"huggingface_downloads":3144,"last_modified":"2024-07-10","last_updated":"2026-06-29"},{"id":"stablelm-2-1_6b-chat","name":"Stablelm 2 1 6b Chat","created_by":"stability","source":"official","description":"Stablelm 2 1 6b Chat is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2024-04-08","model_type":"chat","license":"other","parameters":6,"page_url":"https://huggingface.co/stabilityai/stablelm-2-1_6b-chat","open_weight":true,"tagline":"Stablelm 2 1 6b Chat is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["chat_completions"],"huggingface_downloads":843,"last_modified":"2024-06-03","last_updated":"2026-06-29"},{"id":"stablelm-2-1_6b","name":"Stablelm 2 1 6b","created_by":"stability","source":"official","description":"Stablelm 2 1 6b is a 
Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2024-01-18","model_type":"chat","license":"other","parameters":6,"page_url":"https://huggingface.co/stabilityai/stablelm-2-1_6b","open_weight":true,"tagline":"Stablelm 2 1 6b is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["chat_completions"],"huggingface_downloads":10285,"last_modified":"2024-07-10","last_updated":"2026-06-29"},{"id":"stablelm-2-zephyr-1_6b","name":"Stablelm 2 Zephyr 1 6b","created_by":"stability","source":"official","description":"Stablelm 2 Zephyr 1 6b is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2024-01-19","model_type":"chat","license":"other","parameters":6,"page_url":"https://huggingface.co/stabilityai/stablelm-2-zephyr-1_6b","open_weight":true,"tagline":"Stablelm 2 Zephyr 1 6b is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["chat_completions"],"huggingface_downloads":3318,"last_modified":"2024-06-03","last_updated":"2026-06-29"},{"id":"stablelm-3b-4e1t","name":"Stablelm 3b 4e1t","created_by":"stability","source":"official","description":"Stablelm 3b 4e1t is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2023-09-29","model_type":"chat","license":"cc-by-sa-4.0","parameters":3,"page_url":"https://huggingface.co/stabilityai/stablelm-3b-4e1t","open_weight":true,"tagline":"Stablelm 3b 4e1t is a Stability AI model published on the official Stability AI Hugging Face 
organization.","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["chat_completions"],"huggingface_downloads":93520,"last_modified":"2024-03-07","last_updated":"2026-06-29"},{"id":"stablelm-base-alpha-3b-v2","name":"Stablelm Base Alpha 3b V2","created_by":"stability","source":"official","description":"Stablelm Base Alpha 3b V2 is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2023-08-04","model_type":"chat","license":"cc-by-sa-4.0","parameters":3,"page_url":"https://huggingface.co/stabilityai/stablelm-base-alpha-3b-v2","open_weight":true,"tagline":"Stablelm Base Alpha 3b V2 is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["chat_completions"],"huggingface_downloads":531,"last_modified":"2023-09-11","last_updated":"2026-06-29"},{"id":"stablelm-base-alpha-3b","name":"Stablelm Base Alpha 3b","created_by":"stability","source":"official","description":"Stablelm Base Alpha 3b is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2023-04-17","model_type":"chat","license":"cc-by-sa-4.0","parameters":3,"page_url":"https://huggingface.co/stabilityai/stablelm-base-alpha-3b","open_weight":true,"tagline":"Stablelm Base Alpha 3b is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["chat_completions"],"huggingface_downloads":3011,"last_modified":"2023-10-19","last_updated":"2026-06-29"},{"id":"stablelm-base-alpha-7b-v2","name":"Stablelm Base Alpha 7b V2","created_by":"stability","source":"official","description":"Stablelm Base Alpha 7b V2 is a Stability AI model 
published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2023-08-04","model_type":"chat","license":"cc-by-sa-4.0","parameters":7,"page_url":"https://huggingface.co/stabilityai/stablelm-base-alpha-7b-v2","open_weight":true,"tagline":"Stablelm Base Alpha 7b V2 is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["chat_completions"],"huggingface_downloads":457,"last_modified":"2023-09-11","last_updated":"2026-06-29"},{"id":"stablelm-base-alpha-7b","name":"Stablelm Base Alpha 7b","created_by":"stability","source":"official","description":"Stablelm Base Alpha 7b is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2023-04-11","model_type":"chat","license":"cc-by-sa-4.0","parameters":7,"page_url":"https://huggingface.co/stabilityai/stablelm-base-alpha-7b","open_weight":true,"tagline":"Stablelm Base Alpha 7b is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["chat_completions"],"huggingface_downloads":999,"last_modified":"2023-10-19","last_updated":"2026-06-29"},{"id":"stablelm-tuned-alpha-3b","name":"Stablelm Tuned Alpha 3b","created_by":"stability","source":"official","description":"Stablelm Tuned Alpha 3b is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2023-04-19","model_type":"chat","license":"cc-by-nc-sa-4.0","parameters":3,"page_url":"https://huggingface.co/stabilityai/stablelm-tuned-alpha-3b","open_weight":true,"tagline":"Stablelm Tuned Alpha 3b is a Stability AI model published on the official Stability AI Hugging Face 
organization.","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["chat_completions"],"huggingface_downloads":845,"last_modified":"2023-04-19","last_updated":"2026-06-29"},{"id":"stablelm-tuned-alpha-7b","name":"Stablelm Tuned Alpha 7b","created_by":"stability","source":"official","description":"Stablelm Tuned Alpha 7b is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2023-04-19","model_type":"chat","license":"cc-by-nc-sa-4.0","parameters":7,"page_url":"https://huggingface.co/stabilityai/stablelm-tuned-alpha-7b","open_weight":true,"tagline":"Stablelm Tuned Alpha 7b is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["chat_completions"],"huggingface_downloads":5838,"last_modified":"2023-04-19","last_updated":"2026-06-29"},{"id":"stablelm-zephyr-3b","name":"Stablelm Zephyr 3b","created_by":"stability","source":"official","description":"Stablelm Zephyr 3b is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2023-11-21","model_type":"chat","license":"other","parameters":3,"page_url":"https://huggingface.co/stabilityai/stablelm-zephyr-3b","open_weight":true,"tagline":"Stablelm Zephyr 3b is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["chat_completions"],"huggingface_downloads":28453,"last_modified":"2024-07-10","last_updated":"2026-06-29"},{"id":"sv3d","name":"Sv3d","created_by":"stability","source":"official","description":"Sv3d is a Stability AI model published on the official Stability AI Hugging Face 
organization.","status":"active","release_date":"2024-03-18","model_type":"video","license":"other","page_url":"https://huggingface.co/stabilityai/sv3d","open_weight":true,"tagline":"Sv3d is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"vision":true,"fine_tuning":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"huggingface_downloads":0,"last_modified":"2024-07-10","last_updated":"2026-05-11"},{"id":"sv4d","name":"Sv4d","created_by":"stability","source":"official","description":"Sv4d is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2024-07-16","model_type":"other","license":"other","page_url":"https://huggingface.co/stabilityai/sv4d","open_weight":true,"tagline":"Sv4d is a Stability AI model published on the official Stability AI Hugging Face organization.","huggingface_downloads":27,"last_modified":"2024-08-03","last_updated":"2026-06-29"},{"id":"sv4d2.0","name":"Sv4d2.0","created_by":"stability","source":"official","description":"Sv4d2.0 is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2025-02-20","model_type":"other","license":"other","page_url":"https://huggingface.co/stabilityai/sv4d2.0","open_weight":true,"tagline":"Sv4d2.0 is a Stability AI model published on the official Stability AI Hugging Face organization.","huggingface_downloads":365,"last_modified":"2025-04-04","last_updated":"2026-06-29"},{"id":"tiny-random-stablelm-2","name":"Tiny Random Stablelm 2","created_by":"stability","source":"official","description":"Tiny Random Stablelm 2 is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2024-03-20","model_type":"chat","page_url":"https://huggingface.co/stabilityai/tiny-random-stablelm-2","open_weight":true,"tagline":"Tiny Random Stablelm 
2 is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"streaming":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["chat_completions"],"huggingface_downloads":1405,"last_modified":"2024-03-31","last_updated":"2026-06-29"},{"id":"TripoSR","name":"TripoSR","created_by":"stability","source":"official","description":"TripoSR is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2024-02-29","model_type":"other","license":"mit","page_url":"https://huggingface.co/stabilityai/TripoSR","open_weight":true,"tagline":"TripoSR is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"vision":true,"fine_tuning":true},"huggingface_downloads":189582,"last_modified":"2024-08-09","last_updated":"2026-06-29"}]}; +export const provider: ProviderWithModels = {"id":"stability","name":"Stability AI","region":"GB","headquarters":"London, United Kingdom","founded":2019,"url":"https://stability.ai","api_url":"https://api.stability.ai","docs_url":"https://platform.stability.ai/docs","pricing_url":"https://platform.stability.ai/pricing","description":"AI company behind Stable Diffusion, Stable Video, Stable Audio, and related open and hosted generative models.","type":"direct","models_url":"https://huggingface.co/stabilityai","openai_compatible":false,"free_tier":false,"github_url":"https://github.com/Stability-AI","twitter_url":"https://x.com/StabilityAI","icon":"\n \n","models":[{"id":"ar-stablelm-2-base","name":"Ar Stablelm 2 Base","created_by":"stability","source":"official","description":"Ar Stablelm 2 Base is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2024-07-29","model_type":"chat","license":"other","page_url":"https://huggingface.co/stabilityai/ar-stablelm-2-base","open_weight":true,"tagline":"Ar Stablelm 2 Base is 
a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["chat_completions"],"huggingface_downloads":2,"last_modified":"2024-12-06","last_updated":"2026-06-03"},{"id":"ar-stablelm-2-chat-gguf","name":"Ar Stablelm 2 Chat Gguf","created_by":"stability","source":"official","description":"Ar Stablelm 2 Chat Gguf is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2024-08-09","model_type":"other","license":"other","page_url":"https://huggingface.co/stabilityai/ar-stablelm-2-chat-gguf","open_weight":true,"tagline":"Ar Stablelm 2 Chat Gguf is a Stability AI model published on the official Stability AI Hugging Face organization.","huggingface_downloads":6,"last_modified":"2024-12-20","last_updated":"2026-06-03"},{"id":"ar-stablelm-2-chat","name":"Ar Stablelm 2 Chat","created_by":"stability","source":"official","description":"Ar Stablelm 2 Chat is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2024-08-06","model_type":"code","license":"other","page_url":"https://huggingface.co/stabilityai/ar-stablelm-2-chat","open_weight":true,"tagline":"Ar Stablelm 2 Chat is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["chat_completions"],"huggingface_downloads":10,"last_modified":"2024-12-06","last_updated":"2026-06-30"},{"id":"arcade100k","name":"Arcade100k","created_by":"stability","source":"official","description":"Arcade100k is a Stability AI model published on the official Stability AI Hugging Face 
organization.","status":"active","release_date":"2023-10-27","model_type":"other","page_url":"https://huggingface.co/stabilityai/arcade100k","open_weight":true,"tagline":"Arcade100k is a Stability AI model published on the official Stability AI Hugging Face organization.","huggingface_downloads":0,"last_modified":"2024-04-12","last_updated":"2026-05-11"},{"id":"codellama13b_instruct_260k_synthesis","name":"Codellama13b Instruct 260k Synthesis","created_by":"stability","source":"official","family":"codellama","description":"Codellama13b Instruct 260k Synthesis is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2023-11-08","model_type":"chat","page_url":"https://huggingface.co/stabilityai/codellama13b_instruct_260k_synthesis","open_weight":true,"tagline":"Codellama13b Instruct 260k Synthesis is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"streaming":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["chat_completions"],"huggingface_downloads":36,"last_modified":"2023-11-08","last_updated":"2026-06-30"},{"id":"control-lora","name":"Control Lora","created_by":"stability","source":"official","description":"Control Lora is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2023-08-17","model_type":"image","license":"other","page_url":"https://huggingface.co/stabilityai/control-lora","open_weight":true,"tagline":"Control Lora is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"vision":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"huggingface_downloads":0,"last_modified":"2023-08-19","last_updated":"2026-05-11"},{"id":"cosxl","name":"Cosxl","created_by":"stability","source":"official","description":"Cosxl is a Stability AI model published on the 
official Stability AI Hugging Face organization.","status":"active","release_date":"2024-04-08","model_type":"image","license":"other","page_url":"https://huggingface.co/stabilityai/cosxl","open_weight":true,"tagline":"Cosxl is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"vision":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"huggingface_downloads":0,"last_modified":"2024-04-13","last_updated":"2026-05-11"},{"id":"japanese-instructblip-alpha","name":"Japanese Instructblip Alpha","created_by":"stability","source":"official","description":"Japanese Instructblip Alpha is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2023-08-15","model_type":"code","license":"other","page_url":"https://huggingface.co/stabilityai/japanese-instructblip-alpha","open_weight":true,"tagline":"Japanese Instructblip Alpha is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"vision":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text","image"],"output":["text"]},"endpoints":["chat_completions"],"huggingface_downloads":49,"last_modified":"2023-11-17","last_updated":"2026-06-30"},{"id":"japanese-stable-clip-vit-l-16","name":"Japanese Stable Clip Vit L 16","created_by":"stability","source":"official","description":"Japanese Stable Clip Vit L 16 is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2023-11-01","model_type":"code","license":"other","page_url":"https://huggingface.co/stabilityai/japanese-stable-clip-vit-l-16","open_weight":true,"tagline":"Japanese Stable Clip Vit L 16 is a Stability AI model published on the official Stability AI Hugging Face 
organization.","capabilities":{"streaming":true,"fine_tuning":true,"vision":true},"modalities":{"input":["text","image"],"output":["text"]},"endpoints":["chat_completions"],"huggingface_downloads":1579,"last_modified":"2024-07-10","last_updated":"2026-06-30"},{"id":"japanese-stable-diffusion-xl","name":"Japanese Stable Diffusion Xl","created_by":"stability","source":"official","description":"Japanese Stable Diffusion Xl is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2023-11-01","model_type":"image","license":"other","page_url":"https://huggingface.co/stabilityai/japanese-stable-diffusion-xl","open_weight":true,"tagline":"Japanese Stable Diffusion Xl is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"vision":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"huggingface_downloads":45,"last_modified":"2024-07-10","last_updated":"2026-06-29"},{"id":"japanese-stable-vlm","name":"Japanese Stable Vlm","created_by":"stability","source":"official","description":"Japanese Stable Vlm is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2023-11-01","model_type":"code","license":"other","page_url":"https://huggingface.co/stabilityai/japanese-stable-vlm","open_weight":true,"tagline":"Japanese Stable Vlm is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"vision":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text","image"],"output":["text"]},"endpoints":["chat_completions"],"huggingface_downloads":14,"last_modified":"2024-07-10","last_updated":"2026-06-30"},{"id":"japanese-stablelm-2-base-1_6b","name":"Japanese Stablelm 2 Base 1 6b","created_by":"stability","source":"official","description":"Japanese Stablelm 2 Base 1 6b is a Stability AI model 
published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2024-05-02","model_type":"chat","license":"other","parameters":6,"page_url":"https://huggingface.co/stabilityai/japanese-stablelm-2-base-1_6b","open_weight":true,"tagline":"Japanese Stablelm 2 Base 1 6b is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["chat_completions"],"huggingface_downloads":3,"last_modified":"2024-05-02","last_updated":"2026-06-03"},{"id":"japanese-stablelm-2-instruct-1_6b","name":"Japanese Stablelm 2 Instruct 1 6b","created_by":"stability","source":"official","description":"Japanese Stablelm 2 Instruct 1 6b is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2024-05-02","model_type":"chat","license":"other","parameters":6,"page_url":"https://huggingface.co/stabilityai/japanese-stablelm-2-instruct-1_6b","open_weight":true,"tagline":"Japanese Stablelm 2 Instruct 1 6b is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["chat_completions"],"huggingface_downloads":68,"last_modified":"2024-07-10","last_updated":"2026-06-03"},{"id":"japanese-stablelm-3b-4e1t-base","name":"Japanese Stablelm 3b 4e1t Base","created_by":"stability","source":"official","description":"Japanese Stablelm 3b 4e1t Base is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2023-10-16","model_type":"chat","license":"apache-2.0","parameters":3,"page_url":"https://huggingface.co/stabilityai/japanese-stablelm-3b-4e1t-base","open_weight":true,"tagline":"Japanese Stablelm 3b 4e1t Base is a Stability AI model published on the official 
Stability AI Hugging Face organization.","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["chat_completions"],"huggingface_downloads":45,"last_modified":"2024-04-26","last_updated":"2026-06-30"},{"id":"japanese-stablelm-3b-4e1t-instruct","name":"Japanese Stablelm 3b 4e1t Instruct","created_by":"stability","source":"official","description":"Japanese Stablelm 3b 4e1t Instruct is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2023-10-16","model_type":"chat","license":"apache-2.0","parameters":3,"page_url":"https://huggingface.co/stabilityai/japanese-stablelm-3b-4e1t-instruct","open_weight":true,"tagline":"Japanese Stablelm 3b 4e1t Instruct is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["chat_completions"],"huggingface_downloads":147,"last_modified":"2024-04-26","last_updated":"2026-06-30"},{"id":"japanese-stablelm-base-alpha-7b","name":"Japanese Stablelm Base Alpha 7b","created_by":"stability","source":"official","description":"Japanese Stablelm Base Alpha 7b is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2023-08-09","model_type":"chat","license":"apache-2.0","parameters":7,"page_url":"https://huggingface.co/stabilityai/japanese-stablelm-base-alpha-7b","open_weight":true,"tagline":"Japanese Stablelm Base Alpha 7b is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["chat_completions"],"huggingface_downloads":310,"last_modified":"2023-08-22","last_updated":"2026-06-30"},{"id":"japanese-stablelm-base-beta-70b","name":"Japanese Stablelm Base Beta 
70b","created_by":"stability","source":"official","description":"Japanese Stablelm Base Beta 70b is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2023-10-30","model_type":"chat","license":"llama2","parameters":70,"page_url":"https://huggingface.co/stabilityai/japanese-stablelm-base-beta-70b","open_weight":true,"tagline":"Japanese Stablelm Base Beta 70b is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["chat_completions"],"huggingface_downloads":126,"last_modified":"2023-12-19","last_updated":"2026-06-30"},{"id":"japanese-stablelm-base-beta-7b","name":"Japanese Stablelm Base Beta 7b","created_by":"stability","source":"official","description":"Japanese Stablelm Base Beta 7b is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2023-10-30","model_type":"chat","license":"llama2","parameters":7,"page_url":"https://huggingface.co/stabilityai/japanese-stablelm-base-beta-7b","open_weight":true,"tagline":"Japanese Stablelm Base Beta 7b is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["chat_completions"],"huggingface_downloads":48,"last_modified":"2023-12-19","last_updated":"2026-06-30"},{"id":"japanese-stablelm-base-gamma-7b","name":"Japanese Stablelm Base Gamma 7b","created_by":"stability","source":"official","description":"Japanese Stablelm Base Gamma 7b is a Stability AI model published on the official Stability AI Hugging Face 
organization.","status":"active","release_date":"2023-10-16","model_type":"chat","license":"apache-2.0","parameters":7,"page_url":"https://huggingface.co/stabilityai/japanese-stablelm-base-gamma-7b","open_weight":true,"tagline":"Japanese Stablelm Base Gamma 7b is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["chat_completions"],"huggingface_downloads":141,"last_modified":"2024-01-25","last_updated":"2026-06-29"},{"id":"japanese-stablelm-base-ja_vocab-beta-7b","name":"Japanese Stablelm Base Ja Vocab Beta 7b","created_by":"stability","source":"official","description":"Japanese Stablelm Base Ja Vocab Beta 7b is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2023-10-30","model_type":"chat","license":"llama2","parameters":7,"page_url":"https://huggingface.co/stabilityai/japanese-stablelm-base-ja_vocab-beta-7b","open_weight":true,"tagline":"Japanese Stablelm Base Ja Vocab Beta 7b is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["chat_completions"],"huggingface_downloads":39,"last_modified":"2023-12-19","last_updated":"2026-06-30"},{"id":"japanese-stablelm-instruct-alpha-7b-v2","name":"Japanese Stablelm Instruct Alpha 7b V2","created_by":"stability","source":"official","description":"Japanese Stablelm Instruct Alpha 7b V2 is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2023-09-26","model_type":"chat","license":"apache-2.0","parameters":7,"page_url":"https://huggingface.co/stabilityai/japanese-stablelm-instruct-alpha-7b-v2","open_weight":true,"tagline":"Japanese Stablelm Instruct Alpha 7b V2 is a Stability AI 
model published on the official Stability AI Hugging Face organization.","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["chat_completions"],"huggingface_downloads":38,"last_modified":"2023-10-06","last_updated":"2026-06-30"},{"id":"japanese-stablelm-instruct-alpha-7b","name":"Japanese Stablelm Instruct Alpha 7b","created_by":"stability","source":"official","description":"Japanese Stablelm Instruct Alpha 7b is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2023-08-10","model_type":"chat","license":"other","parameters":7,"page_url":"https://huggingface.co/stabilityai/japanese-stablelm-instruct-alpha-7b","open_weight":true,"tagline":"Japanese Stablelm Instruct Alpha 7b is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["chat_completions"],"huggingface_downloads":0,"last_modified":"2023-08-22","last_updated":"2026-05-11"},{"id":"japanese-stablelm-instruct-beta-70b","name":"Japanese Stablelm Instruct Beta 70b","created_by":"stability","source":"official","description":"Japanese Stablelm Instruct Beta 70b is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2023-10-30","model_type":"chat","license":"llama2","parameters":70,"page_url":"https://huggingface.co/stabilityai/japanese-stablelm-instruct-beta-70b","open_weight":true,"tagline":"Japanese Stablelm Instruct Beta 70b is a Stability AI model published on the official Stability AI Hugging Face 
organization.","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["chat_completions"],"huggingface_downloads":131,"last_modified":"2023-12-19","last_updated":"2026-06-29"},{"id":"japanese-stablelm-instruct-beta-7b","name":"Japanese Stablelm Instruct Beta 7b","created_by":"stability","source":"official","description":"Japanese Stablelm Instruct Beta 7b is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2023-10-30","model_type":"chat","license":"llama2","parameters":7,"page_url":"https://huggingface.co/stabilityai/japanese-stablelm-instruct-beta-7b","open_weight":true,"tagline":"Japanese Stablelm Instruct Beta 7b is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["chat_completions"],"huggingface_downloads":58,"last_modified":"2023-12-19","last_updated":"2026-06-29"},{"id":"japanese-stablelm-instruct-gamma-7b","name":"Japanese Stablelm Instruct Gamma 7b","created_by":"stability","source":"official","description":"Japanese Stablelm Instruct Gamma 7b is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2023-10-16","model_type":"chat","license":"apache-2.0","parameters":7,"page_url":"https://huggingface.co/stabilityai/japanese-stablelm-instruct-gamma-7b","open_weight":true,"tagline":"Japanese Stablelm Instruct Gamma 7b is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["chat_completions"],"huggingface_downloads":151,"last_modified":"2024-01-24","last_updated":"2026-06-29"},{"id":"japanese-stablelm-instruct-ja_vocab-beta-7b","name":"Japanese Stablelm Instruct 
Ja Vocab Beta 7b","created_by":"stability","source":"official","description":"Japanese Stablelm Instruct Ja Vocab Beta 7b is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2023-10-30","model_type":"chat","license":"llama2","parameters":7,"page_url":"https://huggingface.co/stabilityai/japanese-stablelm-instruct-ja_vocab-beta-7b","open_weight":true,"tagline":"Japanese Stablelm Instruct Ja Vocab Beta 7b is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["chat_completions"],"huggingface_downloads":44,"last_modified":"2023-12-19","last_updated":"2026-06-30"},{"id":"SAME-L","name":"SAME L","created_by":"stability","source":"official","description":"SAME L is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2026-05-17","model_type":"code","license":"other","page_url":"https://huggingface.co/stabilityai/SAME-L","open_weight":true,"tagline":"SAME L is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["chat_completions"],"huggingface_downloads":6334,"last_modified":"2026-06-24","last_updated":"2026-06-30"},{"id":"SAME-S","name":"SAME S","created_by":"stability","source":"official","description":"SAME S is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2026-05-17","model_type":"code","license":"other","page_url":"https://huggingface.co/stabilityai/SAME-S","open_weight":true,"tagline":"SAME S is a Stability AI model published on the official Stability AI Hugging Face 
organization.","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["chat_completions"],"huggingface_downloads":1587,"last_modified":"2026-05-19","last_updated":"2026-06-30"},{"id":"sd-turbo","name":"Sd Turbo","created_by":"stability","source":"official","description":"Sd Turbo is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2023-11-27","model_type":"image","page_url":"https://huggingface.co/stabilityai/sd-turbo","open_weight":true,"tagline":"Sd Turbo is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"huggingface_downloads":684119,"last_modified":"2024-07-10","last_updated":"2026-06-30"},{"id":"sd-vae-ft-ema-original","name":"Sd Vae Ft Ema Original","created_by":"stability","source":"official","description":"Sd Vae Ft Ema Original is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2022-10-13","model_type":"image","license":"mit","page_url":"https://huggingface.co/stabilityai/sd-vae-ft-ema-original","open_weight":true,"tagline":"Sd Vae Ft Ema Original is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"vision":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"huggingface_downloads":0,"last_modified":"2022-12-19","last_updated":"2026-05-11"},{"id":"sd-vae-ft-ema","name":"Sd Vae Ft Ema","created_by":"stability","source":"official","description":"Sd Vae Ft Ema is a Stability AI model published on the official Stability AI Hugging Face 
organization.","status":"active","release_date":"2022-10-13","model_type":"other","license":"mit","page_url":"https://huggingface.co/stabilityai/sd-vae-ft-ema","open_weight":true,"tagline":"Sd Vae Ft Ema is a Stability AI model published on the official Stability AI Hugging Face organization.","huggingface_downloads":6837,"last_modified":"2023-06-05","last_updated":"2026-06-30"},{"id":"sd-vae-ft-mse-original","name":"Sd Vae Ft Mse Original","created_by":"stability","source":"official","description":"Sd Vae Ft Mse Original is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2022-10-13","model_type":"image","license":"mit","page_url":"https://huggingface.co/stabilityai/sd-vae-ft-mse-original","open_weight":true,"tagline":"Sd Vae Ft Mse Original is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"vision":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"huggingface_downloads":1,"last_modified":"2022-12-19","last_updated":"2026-06-29"},{"id":"sd-vae-ft-mse","name":"Sd Vae Ft Mse","created_by":"stability","source":"official","description":"Sd Vae Ft Mse is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2022-10-13","model_type":"other","license":"mit","page_url":"https://huggingface.co/stabilityai/sd-vae-ft-mse","open_weight":true,"tagline":"Sd Vae Ft Mse is a Stability AI model published on the official Stability AI Hugging Face organization.","huggingface_downloads":102400,"last_modified":"2023-06-06","last_updated":"2026-06-30"},{"id":"sd-x2-latent-upscaler","name":"Sd X2 Latent Upscaler","created_by":"stability","source":"official","description":"Sd X2 Latent Upscaler is a Stability AI model published on the official Stability AI Hugging Face 
organization.","status":"active","release_date":"2023-02-03","model_type":"other","license":"openrail++","page_url":"https://huggingface.co/stabilityai/sd-x2-latent-upscaler","open_weight":true,"tagline":"Sd X2 Latent Upscaler is a Stability AI model published on the official Stability AI Hugging Face organization.","huggingface_downloads":129146,"last_modified":"2023-06-05","last_updated":"2026-06-30"},{"id":"sdxl-turbo-ryzen-ai","name":"Sdxl Turbo Ryzen Ai","created_by":"stability","source":"official","description":"Sdxl Turbo Ryzen Ai is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2024-12-06","model_type":"image","license":"other","page_url":"https://huggingface.co/stabilityai/sdxl-turbo-ryzen-ai","open_weight":true,"tagline":"Sdxl Turbo Ryzen Ai is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"vision":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"huggingface_downloads":489,"last_modified":"2024-12-11","last_updated":"2026-06-29"},{"id":"sdxl-turbo-tensorrt","name":"Sdxl Turbo Tensorrt","created_by":"stability","source":"official","description":"Sdxl Turbo Tensorrt is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2023-12-28","model_type":"image","license":"other","page_url":"https://huggingface.co/stabilityai/sdxl-turbo-tensorrt","open_weight":true,"tagline":"Sdxl Turbo Tensorrt is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"vision":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"huggingface_downloads":30,"last_modified":"2025-10-20","last_updated":"2026-06-30"},{"id":"sdxl-turbo","name":"Sdxl Turbo","created_by":"stability","source":"official","description":"Sdxl Turbo is a Stability AI 
model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2023-11-27","model_type":"image","license":"other","page_url":"https://huggingface.co/stabilityai/sdxl-turbo","open_weight":true,"tagline":"Sdxl Turbo is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"vision":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"huggingface_downloads":597950,"last_modified":"2024-07-10","last_updated":"2026-06-30"},{"id":"sdxl-vae","name":"Sdxl Vae","created_by":"stability","source":"official","description":"Sdxl Vae is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2023-06-21","model_type":"other","license":"mit","page_url":"https://huggingface.co/stabilityai/sdxl-vae","open_weight":true,"tagline":"Sdxl Vae is a Stability AI model published on the official Stability AI Hugging Face organization.","huggingface_downloads":259409,"last_modified":"2023-08-04","last_updated":"2026-06-30"},{"id":"sp4d","name":"Sp4d","created_by":"stability","source":"official","description":"Sp4d is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2025-11-03","model_type":"other","license":"other","page_url":"https://huggingface.co/stabilityai/sp4d","open_weight":true,"tagline":"Sp4d is a Stability AI model published on the official Stability AI Hugging Face organization.","huggingface_downloads":12,"last_modified":"2025-11-05","last_updated":"2026-06-30"},{"id":"stable-audio-3-medium-base","name":"Stable Audio 3 Medium Base","created_by":"stability","source":"official","description":"Stable Audio 3 Medium Base is a Stability AI model published on the official Stability AI Hugging Face 
organization.","status":"active","release_date":"2026-05-17","model_type":"audio","license":"other","page_url":"https://huggingface.co/stabilityai/stable-audio-3-medium-base","open_weight":true,"tagline":"Stable Audio 3 Medium Base is a Stability AI model published on the official Stability AI Hugging Face organization.","huggingface_downloads":4447,"last_modified":"2026-06-16","last_updated":"2026-06-30"},{"id":"stable-audio-3-medium","name":"Stable Audio 3 Medium","created_by":"stability","source":"official","description":"Stable Audio 3 Medium is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2026-05-17","model_type":"audio","license":"other","page_url":"https://huggingface.co/stabilityai/stable-audio-3-medium","open_weight":true,"tagline":"Stable Audio 3 Medium is a Stability AI model published on the official Stability AI Hugging Face organization.","huggingface_downloads":57092,"last_modified":"2026-06-16","last_updated":"2026-06-30"},{"id":"stable-audio-3-small-music-base","name":"Stable Audio 3 Small Music Base","created_by":"stability","source":"official","description":"Stable Audio 3 Small Music Base is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2026-05-16","model_type":"audio","license":"other","page_url":"https://huggingface.co/stabilityai/stable-audio-3-small-music-base","open_weight":true,"tagline":"Stable Audio 3 Small Music Base is a Stability AI model published on the official Stability AI Hugging Face organization.","huggingface_downloads":1747,"last_modified":"2026-05-20","last_updated":"2026-06-30"},{"id":"stable-audio-3-small-music","name":"Stable Audio 3 Small Music","created_by":"stability","source":"official","description":"Stable Audio 3 Small Music is a Stability AI model published on the official Stability AI Hugging Face 
organization.","status":"active","release_date":"2026-05-17","model_type":"audio","license":"other","page_url":"https://huggingface.co/stabilityai/stable-audio-3-small-music","open_weight":true,"tagline":"Stable Audio 3 Small Music is a Stability AI model published on the official Stability AI Hugging Face organization.","huggingface_downloads":15375,"last_modified":"2026-05-19","last_updated":"2026-06-30"},{"id":"stable-audio-3-small-sfx-base","name":"Stable Audio 3 Small Sfx Base","created_by":"stability","source":"official","description":"Stable Audio 3 Small Sfx Base is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2026-05-17","model_type":"audio","license":"other","page_url":"https://huggingface.co/stabilityai/stable-audio-3-small-sfx-base","open_weight":true,"tagline":"Stable Audio 3 Small Sfx Base is a Stability AI model published on the official Stability AI Hugging Face organization.","huggingface_downloads":1064,"last_modified":"2026-05-20","last_updated":"2026-06-30"},{"id":"stable-audio-3-small-sfx","name":"Stable Audio 3 Small Sfx","created_by":"stability","source":"official","description":"Stable Audio 3 Small Sfx is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2026-05-17","model_type":"audio","license":"other","page_url":"https://huggingface.co/stabilityai/stable-audio-3-small-sfx","open_weight":true,"tagline":"Stable Audio 3 Small Sfx is a Stability AI model published on the official Stability AI Hugging Face organization.","huggingface_downloads":12045,"last_modified":"2026-05-19","last_updated":"2026-06-30"},{"id":"stable-audio-open-1.0","name":"Stable Audio Open 1.0","created_by":"stability","source":"official","description":"Stable Audio Open 1.0 is a Stability AI model published on the official Stability AI Hugging Face 
organization.","status":"active","release_date":"2024-05-24","model_type":"audio","license":"other","page_url":"https://huggingface.co/stabilityai/stable-audio-open-1.0","open_weight":true,"tagline":"Stable Audio Open 1.0 is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"tool_call":true,"fine_tuning":true},"tools":["function_calling"],"huggingface_downloads":25989,"last_modified":"2025-06-19","last_updated":"2026-06-30"},{"id":"stable-audio-open-small","name":"Stable Audio Open Small","created_by":"stability","source":"official","description":"Stable Audio Open Small is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2025-05-12","model_type":"audio","license":"other","page_url":"https://huggingface.co/stabilityai/stable-audio-open-small","open_weight":true,"tagline":"Stable Audio Open Small is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"tool_call":true,"fine_tuning":true},"tools":["function_calling"],"huggingface_downloads":2169,"last_modified":"2025-05-27","last_updated":"2026-06-30"},{"id":"stable-cascade-prior","name":"Stable Cascade Prior","created_by":"stability","source":"official","description":"Stable Cascade Prior is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2024-02-12","model_type":"image","license":"other","page_url":"https://huggingface.co/stabilityai/stable-cascade-prior","open_weight":true,"tagline":"Stable Cascade Prior is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"vision":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"huggingface_downloads":796,"last_modified":"2024-03-14","last_updated":"2026-06-30"},{"id":"stable-cascade","name":"Stable 
Cascade","created_by":"stability","source":"official","description":"Stable Cascade is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2024-02-06","model_type":"image","license":"other","page_url":"https://huggingface.co/stabilityai/stable-cascade","open_weight":true,"tagline":"Stable Cascade is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"vision":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"huggingface_downloads":8407,"last_modified":"2024-03-16","last_updated":"2026-06-30"},{"id":"stable-code-3b","name":"Stable Code 3b","created_by":"stability","source":"official","description":"Stable Code 3b is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2024-01-09","model_type":"chat","license":"other","parameters":3,"page_url":"https://huggingface.co/stabilityai/stable-code-3b","open_weight":true,"tagline":"Stable Code 3b is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["chat_completions"],"huggingface_downloads":5825,"last_modified":"2024-07-10","last_updated":"2026-06-30"},{"id":"stable-code-instruct-3b","name":"Stable Code Instruct 3b","created_by":"stability","source":"official","description":"Stable Code Instruct 3b is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2024-03-06","model_type":"chat","license":"other","parameters":3,"page_url":"https://huggingface.co/stabilityai/stable-code-instruct-3b","open_weight":true,"tagline":"Stable Code Instruct 3b is a Stability AI model published on the official Stability AI Hugging Face 
organization.","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["chat_completions"],"huggingface_downloads":2318,"last_modified":"2024-07-10","last_updated":"2026-06-30"},{"id":"stable-codec-speech-16k-base","name":"Stable Codec Speech 16k Base","created_by":"stability","source":"official","description":"Stable Codec Speech 16k Base is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2025-01-14","model_type":"other","license":"other","page_url":"https://huggingface.co/stabilityai/stable-codec-speech-16k-base","open_weight":true,"tagline":"Stable Codec Speech 16k Base is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"tool_call":true,"fine_tuning":true},"tools":["function_calling"],"huggingface_downloads":1,"last_modified":"2025-01-14","last_updated":"2026-06-03"},{"id":"stable-codec-speech-16k","name":"Stable Codec Speech 16k","created_by":"stability","source":"official","description":"Stable Codec Speech 16k is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2025-01-10","model_type":"other","license":"other","page_url":"https://huggingface.co/stabilityai/stable-codec-speech-16k","open_weight":true,"tagline":"Stable Codec Speech 16k is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"tool_call":true,"fine_tuning":true},"tools":["function_calling"],"huggingface_downloads":334,"last_modified":"2025-01-10","last_updated":"2026-06-29"},{"id":"stable-diffusion-3-medium-amdnpu","name":"Stable Diffusion 3 Medium Amdnpu","created_by":"stability","source":"official","description":"Stable Diffusion 3 Medium Amdnpu is a Stability AI model published on the official Stability AI Hugging Face 
organization.","status":"active","release_date":"2026-05-01","model_type":"image","license":"other","page_url":"https://huggingface.co/stabilityai/stable-diffusion-3-medium-amdnpu","open_weight":true,"tagline":"Stable Diffusion 3 Medium Amdnpu is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"vision":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"huggingface_downloads":31,"last_modified":"2026-05-05","last_updated":"2026-06-30"},{"id":"stable-diffusion-3-medium-diffusers","name":"Stable Diffusion 3 Medium Diffusers","created_by":"stability","source":"official","description":"Stable Diffusion 3 Medium Diffusers is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2024-06-12","model_type":"image","license":"other","page_url":"https://huggingface.co/stabilityai/stable-diffusion-3-medium-diffusers","open_weight":true,"tagline":"Stable Diffusion 3 Medium Diffusers is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"vision":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"huggingface_downloads":32528,"last_modified":"2024-06-19","last_updated":"2026-06-30"},{"id":"stable-diffusion-3-medium-tensorrt","name":"Stable Diffusion 3 Medium Tensorrt","created_by":"stability","source":"official","description":"Stable Diffusion 3 Medium Tensorrt is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2024-06-12","model_type":"image","license":"other","page_url":"https://huggingface.co/stabilityai/stable-diffusion-3-medium-tensorrt","open_weight":true,"tagline":"Stable Diffusion 3 Medium Tensorrt is a Stability AI model published on the official Stability AI Hugging Face 
organization.","capabilities":{"vision":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"huggingface_downloads":15,"last_modified":"2025-10-20","last_updated":"2026-06-29"},{"id":"stable-diffusion-3-medium","name":"Stable Diffusion 3 Medium","created_by":"stability","source":"official","description":"Stable Diffusion 3 Medium is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2024-05-30","model_type":"image","license":"other","page_url":"https://huggingface.co/stabilityai/stable-diffusion-3-medium","open_weight":true,"tagline":"Stable Diffusion 3 Medium is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"vision":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"huggingface_downloads":3491,"last_modified":"2024-08-12","last_updated":"2026-06-30"},{"id":"stable-diffusion-3-medium_amdgpu","name":"Stable Diffusion 3 Medium Amdgpu","created_by":"stability","source":"official","description":"Stable Diffusion 3 Medium Amdgpu is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2025-02-28","model_type":"image","license":"other","page_url":"https://huggingface.co/stabilityai/stable-diffusion-3-medium_amdgpu","open_weight":true,"tagline":"Stable Diffusion 3 Medium Amdgpu is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"vision":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"huggingface_downloads":0,"last_modified":"2025-07-16","last_updated":"2026-05-11"},{"id":"stable-diffusion-3.5-controlnets-tensorrt","name":"Stable Diffusion 3.5 Controlnets Tensorrt","created_by":"stability","source":"official","description":"Stable Diffusion 3.5 Controlnets Tensorrt is a Stability 
AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2025-08-07","model_type":"image","license":"other","page_url":"https://huggingface.co/stabilityai/stable-diffusion-3.5-controlnets-tensorrt","open_weight":true,"tagline":"Stable Diffusion 3.5 Controlnets Tensorrt is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"vision":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"huggingface_downloads":177,"last_modified":"2025-10-20","last_updated":"2026-06-29"},{"id":"stable-diffusion-3.5-controlnets","name":"Stable Diffusion 3.5 Controlnets","created_by":"stability","source":"official","description":"Stable Diffusion 3.5 Controlnets is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2024-11-15","model_type":"image","license":"other","page_url":"https://huggingface.co/stabilityai/stable-diffusion-3.5-controlnets","open_weight":true,"tagline":"Stable Diffusion 3.5 Controlnets is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"vision":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"huggingface_downloads":12,"last_modified":"2024-12-11","last_updated":"2026-06-29"},{"id":"stable-diffusion-3.5-large-controlnet-blur","name":"Stable Diffusion 3.5 Large Controlnet Blur","created_by":"stability","source":"official","description":"Stable Diffusion 3.5 Large Controlnet Blur is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2024-11-25","model_type":"image","license":"other","page_url":"https://huggingface.co/stabilityai/stable-diffusion-3.5-large-controlnet-blur","open_weight":true,"tagline":"Stable Diffusion 3.5 Large Controlnet Blur is a Stability AI model published 
on the official Stability AI Hugging Face organization.","capabilities":{"vision":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"huggingface_downloads":53,"last_modified":"2024-11-28","last_updated":"2026-06-29"},{"id":"stable-diffusion-3.5-large-controlnet-canny","name":"Stable Diffusion 3.5 Large Controlnet Canny","created_by":"stability","source":"official","description":"Stable Diffusion 3.5 Large Controlnet Canny is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2024-11-25","model_type":"image","license":"other","page_url":"https://huggingface.co/stabilityai/stable-diffusion-3.5-large-controlnet-canny","open_weight":true,"tagline":"Stable Diffusion 3.5 Large Controlnet Canny is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"vision":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"huggingface_downloads":21152,"last_modified":"2024-11-28","last_updated":"2026-06-29"},{"id":"stable-diffusion-3.5-large-controlnet-depth","name":"Stable Diffusion 3.5 Large Controlnet Depth","created_by":"stability","source":"official","description":"Stable Diffusion 3.5 Large Controlnet Depth is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2024-11-25","model_type":"image","license":"other","page_url":"https://huggingface.co/stabilityai/stable-diffusion-3.5-large-controlnet-depth","open_weight":true,"tagline":"Stable Diffusion 3.5 Large Controlnet Depth is a Stability AI model published on the official Stability AI Hugging Face 
organization.","capabilities":{"vision":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"huggingface_downloads":24549,"last_modified":"2024-11-28","last_updated":"2026-06-29"},{"id":"stable-diffusion-3.5-large-tensorrt","name":"Stable Diffusion 3.5 Large Tensorrt","created_by":"stability","source":"official","description":"Stable Diffusion 3.5 Large Tensorrt is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2025-05-16","model_type":"image","license":"other","page_url":"https://huggingface.co/stabilityai/stable-diffusion-3.5-large-tensorrt","open_weight":true,"tagline":"Stable Diffusion 3.5 Large Tensorrt is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"vision":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"huggingface_downloads":1483,"last_modified":"2025-10-20","last_updated":"2026-06-30"},{"id":"stable-diffusion-3.5-large-turbo","name":"Stable Diffusion 3.5 Large Turbo","created_by":"stability","source":"official","description":"Stable Diffusion 3.5 Large Turbo is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2024-10-22","model_type":"image","license":"other","page_url":"https://huggingface.co/stabilityai/stable-diffusion-3.5-large-turbo","open_weight":true,"tagline":"Stable Diffusion 3.5 Large Turbo is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"vision":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"huggingface_downloads":6991,"last_modified":"2024-10-22","last_updated":"2026-06-29"},{"id":"stable-diffusion-3.5-large","name":"Stable Diffusion 3.5 Large","created_by":"stability","source":"official","description":"Stable Diffusion 3.5 Large is 
a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2024-10-22","model_type":"image","license":"other","page_url":"https://huggingface.co/stabilityai/stable-diffusion-3.5-large","open_weight":true,"tagline":"Stable Diffusion 3.5 Large is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"vision":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"huggingface_downloads":26298,"last_modified":"2024-10-22","last_updated":"2026-06-29"},{"id":"stable-diffusion-3.5-medium-tensorrt","name":"Stable Diffusion 3.5 Medium Tensorrt","created_by":"stability","source":"official","description":"Stable Diffusion 3.5 Medium Tensorrt is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2025-08-07","model_type":"image","license":"other","page_url":"https://huggingface.co/stabilityai/stable-diffusion-3.5-medium-tensorrt","open_weight":true,"tagline":"Stable Diffusion 3.5 Medium Tensorrt is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"vision":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"huggingface_downloads":12,"last_modified":"2025-10-20","last_updated":"2026-06-30"},{"id":"stable-diffusion-3.5-medium","name":"Stable Diffusion 3.5 Medium","created_by":"stability","source":"official","description":"Stable Diffusion 3.5 Medium is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2024-10-29","model_type":"image","license":"other","page_url":"https://huggingface.co/stabilityai/stable-diffusion-3.5-medium","open_weight":true,"tagline":"Stable Diffusion 3.5 Medium is a Stability AI model published on the official Stability AI Hugging Face 
organization.","capabilities":{"vision":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"huggingface_downloads":612474,"last_modified":"2024-10-31","last_updated":"2026-06-29"},{"id":"stable-diffusion-x4-upscaler","name":"Stable Diffusion X4 Upscaler","created_by":"stability","source":"official","description":"Stable Diffusion X4 Upscaler is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2022-11-23","model_type":"other","license":"openrail++","page_url":"https://huggingface.co/stabilityai/stable-diffusion-x4-upscaler","open_weight":true,"tagline":"Stable Diffusion X4 Upscaler is a Stability AI model published on the official Stability AI Hugging Face organization.","huggingface_downloads":10040,"last_modified":"2023-07-05","last_updated":"2026-06-30"},{"id":"stable-diffusion-xl-1.0-tensorrt","name":"Stable Diffusion Xl 1.0 Tensorrt","created_by":"stability","source":"official","description":"Stable Diffusion Xl 1.0 Tensorrt is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2023-08-22","model_type":"image","license":"openrail++","page_url":"https://huggingface.co/stabilityai/stable-diffusion-xl-1.0-tensorrt","open_weight":true,"tagline":"Stable Diffusion Xl 1.0 Tensorrt is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"vision":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"huggingface_downloads":276,"last_modified":"2025-10-20","last_updated":"2026-06-30"},{"id":"stable-diffusion-xl-base-0.9","name":"Stable Diffusion Xl Base 0.9","created_by":"stability","source":"official","description":"Stable Diffusion Xl Base 0.9 is a Stability AI model published on the official Stability AI Hugging Face 
organization.","status":"active","release_date":"2023-06-19","model_type":"image","license":"other","page_url":"https://huggingface.co/stabilityai/stable-diffusion-xl-base-0.9","open_weight":true,"tagline":"Stable Diffusion Xl Base 0.9 is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"vision":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"huggingface_downloads":51,"last_modified":"2023-07-12","last_updated":"2026-06-30"},{"id":"stable-diffusion-xl-base-1.0","name":"Stable Diffusion Xl Base 1.0","created_by":"stability","source":"official","description":"Stable Diffusion Xl Base 1.0 is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2023-07-25","model_type":"image","license":"openrail++","page_url":"https://huggingface.co/stabilityai/stable-diffusion-xl-base-1.0","open_weight":true,"tagline":"Stable Diffusion Xl Base 1.0 is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"vision":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["image"]},"endpoints":["images"],"huggingface_downloads":1323188,"last_modified":"2023-10-30","last_updated":"2026-06-30"},{"id":"stable-diffusion-xl-refiner-0.9","name":"Stable Diffusion Xl Refiner 0.9","created_by":"stability","source":"official","description":"Stable Diffusion Xl Refiner 0.9 is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2023-06-21","model_type":"image","license":"other","page_url":"https://huggingface.co/stabilityai/stable-diffusion-xl-refiner-0.9","open_weight":true,"tagline":"Stable Diffusion Xl Refiner 0.9 is a Stability AI model published on the official Stability AI Hugging Face 
organization.","capabilities":{"vision":true,"fine_tuning":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"huggingface_downloads":48,"last_modified":"2023-07-12","last_updated":"2026-06-30"},{"id":"stable-diffusion-xl-refiner-1.0","name":"Stable Diffusion Xl Refiner 1.0","created_by":"stability","source":"official","description":"Stable Diffusion Xl Refiner 1.0 is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2023-07-26","model_type":"image","license":"openrail++","page_url":"https://huggingface.co/stabilityai/stable-diffusion-xl-refiner-1.0","open_weight":true,"tagline":"Stable Diffusion Xl Refiner 1.0 is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"vision":true,"fine_tuning":true},"modalities":{"input":["text","image"],"output":["image"]},"endpoints":["images"],"huggingface_downloads":161798,"last_modified":"2023-09-25","last_updated":"2026-06-30"},{"id":"stable-fast-3d","name":"Stable Fast 3d","created_by":"stability","source":"official","description":"Stable Fast 3d is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2024-07-17","model_type":"other","license":"other","page_url":"https://huggingface.co/stabilityai/stable-fast-3d","open_weight":true,"tagline":"Stable Fast 3d is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"vision":true,"fine_tuning":true},"huggingface_downloads":11721,"last_modified":"2025-04-08","last_updated":"2026-06-30"},{"id":"stable-point-aware-3d","name":"Stable Point Aware 3d","created_by":"stability","source":"official","description":"Stable Point Aware 3d is a Stability AI model published on the official Stability AI Hugging Face 
organization.","status":"active","release_date":"2024-12-28","model_type":"other","license":"other","page_url":"https://huggingface.co/stabilityai/stable-point-aware-3d","open_weight":true,"tagline":"Stable Point Aware 3d is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"vision":true,"fine_tuning":true},"huggingface_downloads":2132,"last_modified":"2025-04-08","last_updated":"2026-06-29"},{"id":"stable-video-diffusion-img2vid-xt-1-1-tensorrt","name":"Stable Video Diffusion Img2vid Xt 1 1 Tensorrt","created_by":"stability","source":"official","description":"Stable Video Diffusion Img2vid Xt 1 1 Tensorrt is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2024-03-07","model_type":"video","license":"other","page_url":"https://huggingface.co/stabilityai/stable-video-diffusion-img2vid-xt-1-1-tensorrt","open_weight":true,"tagline":"Stable Video Diffusion Img2vid Xt 1 1 Tensorrt is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"vision":true,"fine_tuning":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"huggingface_downloads":20,"last_modified":"2025-10-20","last_updated":"2026-06-29"},{"id":"stable-video-diffusion-img2vid-xt-1-1","name":"Stable Video Diffusion Img2vid Xt 1 1","created_by":"stability","source":"official","description":"Stable Video Diffusion Img2vid Xt 1 1 is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2024-02-02","model_type":"video","license":"other","page_url":"https://huggingface.co/stabilityai/stable-video-diffusion-img2vid-xt-1-1","open_weight":true,"tagline":"Stable Video Diffusion Img2vid Xt 1 1 is a Stability AI model published on the official Stability AI Hugging Face 
organization.","capabilities":{"vision":true,"fine_tuning":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"huggingface_downloads":7755,"last_modified":"2024-07-10","last_updated":"2026-06-30"},{"id":"stable-video-diffusion-img2vid-xt","name":"Stable Video Diffusion Img2vid Xt","created_by":"stability","source":"official","description":"Stable Video Diffusion Img2vid Xt is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2023-11-20","model_type":"video","license":"other","page_url":"https://huggingface.co/stabilityai/stable-video-diffusion-img2vid-xt","open_weight":true,"tagline":"Stable Video Diffusion Img2vid Xt is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"vision":true,"fine_tuning":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"huggingface_downloads":216367,"last_modified":"2024-07-10","last_updated":"2026-06-30"},{"id":"stable-video-diffusion-img2vid","name":"Stable Video Diffusion Img2vid","created_by":"stability","source":"official","description":"Stable Video Diffusion Img2vid is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2023-11-20","model_type":"video","license":"other","page_url":"https://huggingface.co/stabilityai/stable-video-diffusion-img2vid","open_weight":true,"tagline":"Stable Video Diffusion Img2vid is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"vision":true,"fine_tuning":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"huggingface_downloads":31140,"last_modified":"2024-07-10","last_updated":"2026-06-30"},{"id":"stable-virtual-camera","name":"Stable Virtual Camera","created_by":"stability","source":"official","description":"Stable Virtual Camera is a Stability 
AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2025-02-19","model_type":"video","license":"other","page_url":"https://huggingface.co/stabilityai/stable-virtual-camera","open_weight":true,"tagline":"Stable Virtual Camera is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"vision":true,"fine_tuning":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"huggingface_downloads":9634,"last_modified":"2025-06-03","last_updated":"2026-06-29"},{"id":"stable-zero123","name":"Stable Zero123","created_by":"stability","source":"official","description":"Stable Zero123 is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2023-12-08","model_type":"other","license":"other","page_url":"https://huggingface.co/stabilityai/stable-zero123","open_weight":true,"tagline":"Stable Zero123 is a Stability AI model published on the official Stability AI Hugging Face organization.","huggingface_downloads":0,"last_modified":"2024-07-10","last_updated":"2026-05-11"},{"id":"StableBeluga-13B","name":"StableBeluga 13B","created_by":"stability","source":"official","description":"StableBeluga 13B is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2023-07-27","model_type":"chat","parameters":13,"page_url":"https://huggingface.co/stabilityai/StableBeluga-13B","open_weight":true,"tagline":"StableBeluga 13B is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"streaming":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["chat_completions"],"huggingface_downloads":257,"last_modified":"2023-08-29","last_updated":"2026-06-30"},{"id":"StableBeluga-7B","name":"StableBeluga 
7B","created_by":"stability","source":"official","description":"StableBeluga 7B is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2023-07-27","model_type":"chat","parameters":7,"page_url":"https://huggingface.co/stabilityai/StableBeluga-7B","open_weight":true,"tagline":"StableBeluga 7B is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"streaming":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["chat_completions"],"huggingface_downloads":248,"last_modified":"2023-08-29","last_updated":"2026-06-30"},{"id":"StableBeluga1-Delta","name":"StableBeluga1 Delta","created_by":"stability","source":"official","description":"StableBeluga1 Delta is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2023-07-20","model_type":"chat","license":"cc-by-nc-4.0","page_url":"https://huggingface.co/stabilityai/StableBeluga1-Delta","open_weight":true,"tagline":"StableBeluga1 Delta is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["chat_completions"],"huggingface_downloads":145,"last_modified":"2023-07-27","last_updated":"2026-06-29"},{"id":"StableBeluga2","name":"StableBeluga2","created_by":"stability","source":"official","description":"StableBeluga2 is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2023-07-20","model_type":"chat","page_url":"https://huggingface.co/stabilityai/StableBeluga2","open_weight":true,"tagline":"StableBeluga2 is a Stability AI model published on the official Stability AI Hugging Face 
organization.","capabilities":{"streaming":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["chat_completions"],"huggingface_downloads":761,"last_modified":"2023-09-18","last_updated":"2026-06-30"},{"id":"stablecode-completion-alpha-3b-4k","name":"Stablecode Completion Alpha 3b 4k","created_by":"stability","source":"official","description":"Stablecode Completion Alpha 3b 4k is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2023-08-07","model_type":"chat","license":"apache-2.0","parameters":3,"page_url":"https://huggingface.co/stabilityai/stablecode-completion-alpha-3b-4k","open_weight":true,"tagline":"Stablecode Completion Alpha 3b 4k is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["chat_completions"],"huggingface_downloads":1092,"last_modified":"2023-08-08","last_updated":"2026-06-30"},{"id":"stablecode-completion-alpha-3b","name":"Stablecode Completion Alpha 3b","created_by":"stability","source":"official","description":"Stablecode Completion Alpha 3b is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2023-07-31","model_type":"chat","license":"apache-2.0","parameters":3,"page_url":"https://huggingface.co/stabilityai/stablecode-completion-alpha-3b","open_weight":true,"tagline":"Stablecode Completion Alpha 3b is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["chat_completions"],"huggingface_downloads":385,"last_modified":"2023-08-08","last_updated":"2026-06-30"},{"id":"stablecode-instruct-alpha-3b","name":"Stablecode Instruct Alpha 
3b","created_by":"stability","source":"official","description":"Stablecode Instruct Alpha 3b is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2023-08-07","model_type":"chat","license":"other","parameters":3,"page_url":"https://huggingface.co/stabilityai/stablecode-instruct-alpha-3b","open_weight":true,"tagline":"Stablecode Instruct Alpha 3b is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["chat_completions"],"huggingface_downloads":4,"last_modified":"2023-08-08","last_updated":"2026-06-29"},{"id":"stablelm-2-12b-chat-GGUF","name":"Stablelm 2 12b Chat GGUF","created_by":"stability","source":"official","description":"Stablelm 2 12b Chat GGUF is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2024-04-17","model_type":"chat","license":"other","parameters":12,"page_url":"https://huggingface.co/stabilityai/stablelm-2-12b-chat-GGUF","open_weight":true,"tagline":"Stablelm 2 12b Chat GGUF is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"tool_call":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["chat_completions"],"tools":["function_calling"],"huggingface_downloads":176,"last_modified":"2024-04-20","last_updated":"2026-06-30"},{"id":"stablelm-2-12b-chat","name":"Stablelm 2 12b Chat","created_by":"stability","source":"official","description":"Stablelm 2 12b Chat is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2024-04-04","model_type":"chat","license":"other","parameters":12,"page_url":"https://huggingface.co/stabilityai/stablelm-2-12b-chat","open_weight":true,"tagline":"Stablelm 2 
12b Chat is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"tool_call":true,"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["chat_completions"],"tools":["function_calling"],"huggingface_downloads":260,"last_modified":"2024-05-20","last_updated":"2026-06-30"},{"id":"stablelm-2-12b","name":"Stablelm 2 12b","created_by":"stability","source":"official","description":"Stablelm 2 12b is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2024-03-21","model_type":"chat","license":"other","parameters":12,"page_url":"https://huggingface.co/stabilityai/stablelm-2-12b","open_weight":true,"tagline":"Stablelm 2 12b is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["chat_completions"],"huggingface_downloads":3321,"last_modified":"2024-07-10","last_updated":"2026-06-30"},{"id":"stablelm-2-1_6b-chat","name":"Stablelm 2 1 6b Chat","created_by":"stability","source":"official","description":"Stablelm 2 1 6b Chat is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2024-04-08","model_type":"chat","license":"other","parameters":6,"page_url":"https://huggingface.co/stabilityai/stablelm-2-1_6b-chat","open_weight":true,"tagline":"Stablelm 2 1 6b Chat is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["chat_completions"],"huggingface_downloads":867,"last_modified":"2024-06-03","last_updated":"2026-06-30"},{"id":"stablelm-2-1_6b","name":"Stablelm 2 1 6b","created_by":"stability","source":"official","description":"Stablelm 2 1 6b is a 
Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2024-01-18","model_type":"chat","license":"other","parameters":6,"page_url":"https://huggingface.co/stabilityai/stablelm-2-1_6b","open_weight":true,"tagline":"Stablelm 2 1 6b is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["chat_completions"],"huggingface_downloads":10913,"last_modified":"2024-07-10","last_updated":"2026-06-30"},{"id":"stablelm-2-zephyr-1_6b","name":"Stablelm 2 Zephyr 1 6b","created_by":"stability","source":"official","description":"Stablelm 2 Zephyr 1 6b is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2024-01-19","model_type":"chat","license":"other","parameters":6,"page_url":"https://huggingface.co/stabilityai/stablelm-2-zephyr-1_6b","open_weight":true,"tagline":"Stablelm 2 Zephyr 1 6b is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["chat_completions"],"huggingface_downloads":3299,"last_modified":"2024-06-03","last_updated":"2026-06-30"},{"id":"stablelm-3b-4e1t","name":"Stablelm 3b 4e1t","created_by":"stability","source":"official","description":"Stablelm 3b 4e1t is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2023-09-29","model_type":"chat","license":"cc-by-sa-4.0","parameters":3,"page_url":"https://huggingface.co/stabilityai/stablelm-3b-4e1t","open_weight":true,"tagline":"Stablelm 3b 4e1t is a Stability AI model published on the official Stability AI Hugging Face 
organization.","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["chat_completions"],"huggingface_downloads":93032,"last_modified":"2024-03-07","last_updated":"2026-06-30"},{"id":"stablelm-base-alpha-3b-v2","name":"Stablelm Base Alpha 3b V2","created_by":"stability","source":"official","description":"Stablelm Base Alpha 3b V2 is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2023-08-04","model_type":"chat","license":"cc-by-sa-4.0","parameters":3,"page_url":"https://huggingface.co/stabilityai/stablelm-base-alpha-3b-v2","open_weight":true,"tagline":"Stablelm Base Alpha 3b V2 is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["chat_completions"],"huggingface_downloads":528,"last_modified":"2023-09-11","last_updated":"2026-06-30"},{"id":"stablelm-base-alpha-3b","name":"Stablelm Base Alpha 3b","created_by":"stability","source":"official","description":"Stablelm Base Alpha 3b is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2023-04-17","model_type":"chat","license":"cc-by-sa-4.0","parameters":3,"page_url":"https://huggingface.co/stabilityai/stablelm-base-alpha-3b","open_weight":true,"tagline":"Stablelm Base Alpha 3b is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["chat_completions"],"huggingface_downloads":2984,"last_modified":"2023-10-19","last_updated":"2026-06-30"},{"id":"stablelm-base-alpha-7b-v2","name":"Stablelm Base Alpha 7b V2","created_by":"stability","source":"official","description":"Stablelm Base Alpha 7b V2 is a Stability AI model 
published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2023-08-04","model_type":"chat","license":"cc-by-sa-4.0","parameters":7,"page_url":"https://huggingface.co/stabilityai/stablelm-base-alpha-7b-v2","open_weight":true,"tagline":"Stablelm Base Alpha 7b V2 is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["chat_completions"],"huggingface_downloads":457,"last_modified":"2023-09-11","last_updated":"2026-06-29"},{"id":"stablelm-base-alpha-7b","name":"Stablelm Base Alpha 7b","created_by":"stability","source":"official","description":"Stablelm Base Alpha 7b is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2023-04-11","model_type":"chat","license":"cc-by-sa-4.0","parameters":7,"page_url":"https://huggingface.co/stabilityai/stablelm-base-alpha-7b","open_weight":true,"tagline":"Stablelm Base Alpha 7b is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["chat_completions"],"huggingface_downloads":974,"last_modified":"2023-10-19","last_updated":"2026-06-30"},{"id":"stablelm-tuned-alpha-3b","name":"Stablelm Tuned Alpha 3b","created_by":"stability","source":"official","description":"Stablelm Tuned Alpha 3b is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2023-04-19","model_type":"chat","license":"cc-by-nc-sa-4.0","parameters":3,"page_url":"https://huggingface.co/stabilityai/stablelm-tuned-alpha-3b","open_weight":true,"tagline":"Stablelm Tuned Alpha 3b is a Stability AI model published on the official Stability AI Hugging Face 
organization.","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["chat_completions"],"huggingface_downloads":819,"last_modified":"2023-04-19","last_updated":"2026-06-30"},{"id":"stablelm-tuned-alpha-7b","name":"Stablelm Tuned Alpha 7b","created_by":"stability","source":"official","description":"Stablelm Tuned Alpha 7b is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2023-04-19","model_type":"chat","license":"cc-by-nc-sa-4.0","parameters":7,"page_url":"https://huggingface.co/stabilityai/stablelm-tuned-alpha-7b","open_weight":true,"tagline":"Stablelm Tuned Alpha 7b is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["chat_completions"],"huggingface_downloads":5821,"last_modified":"2023-04-19","last_updated":"2026-06-30"},{"id":"stablelm-zephyr-3b","name":"Stablelm Zephyr 3b","created_by":"stability","source":"official","description":"Stablelm Zephyr 3b is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2023-11-21","model_type":"chat","license":"other","parameters":3,"page_url":"https://huggingface.co/stabilityai/stablelm-zephyr-3b","open_weight":true,"tagline":"Stablelm Zephyr 3b is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"streaming":true,"fine_tuning":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["chat_completions"],"huggingface_downloads":28462,"last_modified":"2024-07-10","last_updated":"2026-06-30"},{"id":"sv3d","name":"Sv3d","created_by":"stability","source":"official","description":"Sv3d is a Stability AI model published on the official Stability AI Hugging Face 
organization.","status":"active","release_date":"2024-03-18","model_type":"video","license":"other","page_url":"https://huggingface.co/stabilityai/sv3d","open_weight":true,"tagline":"Sv3d is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"vision":true,"fine_tuning":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["video"],"huggingface_downloads":0,"last_modified":"2024-07-10","last_updated":"2026-05-11"},{"id":"sv4d","name":"Sv4d","created_by":"stability","source":"official","description":"Sv4d is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2024-07-16","model_type":"other","license":"other","page_url":"https://huggingface.co/stabilityai/sv4d","open_weight":true,"tagline":"Sv4d is a Stability AI model published on the official Stability AI Hugging Face organization.","huggingface_downloads":27,"last_modified":"2024-08-03","last_updated":"2026-06-29"},{"id":"sv4d2.0","name":"Sv4d2.0","created_by":"stability","source":"official","description":"Sv4d2.0 is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2025-02-20","model_type":"other","license":"other","page_url":"https://huggingface.co/stabilityai/sv4d2.0","open_weight":true,"tagline":"Sv4d2.0 is a Stability AI model published on the official Stability AI Hugging Face organization.","huggingface_downloads":365,"last_modified":"2025-04-04","last_updated":"2026-06-29"},{"id":"tiny-random-stablelm-2","name":"Tiny Random Stablelm 2","created_by":"stability","source":"official","description":"Tiny Random Stablelm 2 is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2024-03-20","model_type":"chat","page_url":"https://huggingface.co/stabilityai/tiny-random-stablelm-2","open_weight":true,"tagline":"Tiny Random Stablelm 
2 is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"streaming":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["chat_completions"],"huggingface_downloads":1395,"last_modified":"2024-03-31","last_updated":"2026-06-30"},{"id":"TripoSR","name":"TripoSR","created_by":"stability","source":"official","description":"TripoSR is a Stability AI model published on the official Stability AI Hugging Face organization.","status":"active","release_date":"2024-02-29","model_type":"other","license":"mit","page_url":"https://huggingface.co/stabilityai/TripoSR","open_weight":true,"tagline":"TripoSR is a Stability AI model published on the official Stability AI Hugging Face organization.","capabilities":{"vision":true,"fine_tuning":true},"huggingface_downloads":188532,"last_modified":"2024-08-09","last_updated":"2026-06-30"}]}; export const models: Model[] = provider.models.map((m) => ({ ...m, provider: provider.id })); diff --git a/packages/npm/src/providers/vertex.ts b/packages/npm/src/providers/vertex.ts index cd109298d..8b3cab289 100644 --- a/packages/npm/src/providers/vertex.ts +++ b/packages/npm/src/providers/vertex.ts @@ -3,6 +3,6 @@ import type { ProviderWithModels, Model } from '../types'; -export const provider: ProviderWithModels = {"id":"vertex","name":"Google Vertex AI","region":"US","headquarters":"Mountain View, CA","url":"https://cloud.google.com/vertex-ai","api_url":"https://us-central1-aiplatform.googleapis.com/v1","docs_url":"https://docs.cloud.google.com/vertex-ai/generative-ai/docs/models","pricing_url":"https://cloud.google.com/vertex-ai/generative-ai/pricing","description":"Google Cloud Vertex AI provides enterprise access to Gemini, Claude, Llama, and Mistral 
models.","type":"cloud","playground_url":"https://console.cloud.google.com/vertex-ai/generative","status_url":"https://status.cloud.google.com","sdk":{"python":"google-cloud-aiplatform","javascript":"@google-cloud/vertexai"},"openai_compatible":true,"free_tier":false,"models_url":"https://cloud.google.com/vertex-ai/generative-ai/docs/learn/models","twitter_url":"https://x.com/GoogleDeepMind","blog_url":"https://cloud.google.com/blog/products/ai-machine-learning","terms_url":"https://cloud.google.com/terms/service-terms","support_url":"https://cloud.google.com/vertex-ai/docs/support/getting-support","icon":"\n \n \n \n \n \n \n \n \n","models":[{"id":"antigravity-preview-05-2026","name":"antigravity-preview-05-2026","created_by":"google","source":"official","status":"active","context_window":1048576,"max_output_tokens":65536,"license":"proprietary","open_weight":false,"capabilities":{"streaming":true,"vision":true},"modalities":{"input":["text","image"],"output":["text"]},"endpoints":["generateContent","streamGenerateContent"],"last_updated":"2026-05-23"},{"id":"claude-haiku-4-5@vertex","name":"Claude Haiku 4.5","created_by":"anthropic","source":"official","last_updated":"2026-03-23","family":"claude-haiku","context_window":200000,"max_output_tokens":64000,"capabilities":{"streaming":true,"vision":true,"tool_call":true,"reasoning":true,"structured_output":true,"json_mode":true,"batch":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":1.1,"output":5.5,"cached_input":0.11,"batch_input":0.55,"batch_output":2.75,"tiers":[{"label":"Text tokens","unit":"Per 1M tokens","columns":["Input","Cached input","Output"],"rows":[{"label":"Standard","values":[1.1,0.11,5.5]},{"label":"Batch","values":[0.55,null,2.75]}]}]},"model_type":"chat","tools":["function_calling"],"description":"The fastest model with near-frontier intelligence","tagline":"The fastest model with near-frontier 
intelligence","knowledge_cutoff":"2025-02","training_data_cutoff":"2025-07","license":"proprietary","open_weight":false},{"id":"claude-opus-4-6@vertex","name":"Claude Opus 4.6","created_by":"anthropic","source":"official","last_updated":"2026-03-23","family":"claude-opus","context_window":1000000,"max_output_tokens":128000,"capabilities":{"streaming":true,"vision":true,"tool_call":true,"reasoning":true,"structured_output":true,"json_mode":true,"batch":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":5.5,"output":27.5,"cached_input":0.55,"batch_input":2.75,"batch_output":13.75,"tiers":[{"label":"Text tokens","unit":"Per 1M tokens","columns":["Input","Cached input","Output"],"rows":[{"label":"Standard","values":[5.5,0.55,27.5]},{"label":"Batch","values":[2.75,null,13.75]}]}]},"model_type":"chat","tools":["function_calling"],"description":"The most intelligent broadly available model for agents and coding","tagline":"The most intelligent model for building agents and coding","knowledge_cutoff":"2025-05","training_data_cutoff":"2025-08","license":"proprietary","open_weight":false},{"id":"claude-sonnet-4-6@vertex","name":"Claude Sonnet 4.6","created_by":"anthropic","source":"official","last_updated":"2026-03-23","family":"claude-sonnet","context_window":1000000,"max_output_tokens":64000,"capabilities":{"streaming":true,"vision":true,"tool_call":true,"reasoning":true,"structured_output":true,"json_mode":true,"batch":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":3.3,"output":16.5,"cached_input":0.33,"batch_input":1.65,"batch_output":8.25,"tiers":[{"label":"Text tokens","unit":"Per 1M tokens","columns":["Input","Cached input","Output"],"rows":[{"label":"Standard","values":[3.3,0.33,16.5]},{"label":"Batch","values":[1.65,null,8.25]}]}]},"model_type":"chat","tools":["function_calling"],"description":"The best combination of speed and intelligence","tagline":"The best combination of speed and 
intelligence","knowledge_cutoff":"2025-08","training_data_cutoff":"2026-01","license":"proprietary","open_weight":false},{"id":"deep-research-max-preview-04-2026","name":"deep-research-max-preview-04-2026","created_by":"google","source":"official","family":"deep-research","status":"active","context_window":1048576,"max_output_tokens":65536,"model_type":"reasoning","license":"proprietary","open_weight":false,"capabilities":{"streaming":true,"vision":true},"modalities":{"input":["text","image","video","audio"],"output":["text"]},"endpoints":["generateContent","streamGenerateContent"],"last_updated":"2026-04-22"},{"id":"deep-research-preview-04-2026","name":"deep-research-preview-04-2026","created_by":"google","source":"official","family":"deep-research","status":"active","context_window":1048576,"max_output_tokens":65536,"model_type":"reasoning","license":"proprietary","open_weight":false,"capabilities":{"streaming":true,"vision":true},"modalities":{"input":["text","image","video","audio"],"output":["text"]},"endpoints":["generateContent","streamGenerateContent"],"last_updated":"2026-04-22"},{"id":"deep-research-pro-preview-12-2025","name":"deep-research-pro-preview-12-2025","created_by":"google","source":"official","last_updated":"2026-04-22","status":"active","context_window":1048576,"max_output_tokens":65536,"model_type":"reasoning","capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text","image","video","audio"],"output":["text"]},"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"family":"deep-research","license":"proprietary","open_weight":false},{"id":"embedding-001","name":"embedding-001","created_by":"google","source":"official","last_updated":"2026-06-02","status":"deprecated","deprecation_date":"2025-10-30","model_type":"embed","successor":"gemini-embedding-2","modalities":{"input":["text"],"output":["text"]},"fami
ly":"embed","license":"proprietary","open_weight":false},{"id":"embedding-gecko-001","name":"embedding-gecko-001","created_by":"google","source":"official","last_updated":"2026-06-02","status":"deprecated","deprecation_date":"2025-10-30","model_type":"embed","successor":"gemini-embedding-2","modalities":{"input":["text"],"output":["text"]},"family":"embed","license":"proprietary","open_weight":false},{"id":"gemini-2.0-flash-001","name":"gemini-2.0-flash-001","created_by":"google","source":"official","last_updated":"2026-06-02","family":"gemini-2.0","status":"deprecated","capabilities":{"streaming":true,"vision":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":0.25,"output":0.15,"tiers":[{"label":"Text tokens","unit":"Per 1M tokens","columns":["Input","Cached input","Output"],"rows":[{"label":"Standard","values":[0.15,null,0.6]}]}]},"model_type":"chat","license":"proprietary","open_weight":false,"deprecation_date":"2026-06-01","successor":"gemini-3.5-flash"},{"id":"gemini-2.0-flash-lite-001","name":"gemini-2.0-flash-lite-001","created_by":"google","source":"official","last_updated":"2026-06-02","family":"gemini-2.0","status":"deprecated","capabilities":{"streaming":true,"vision":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":0.25,"output":0.15,"tiers":[{"label":"Text tokens","unit":"Per 1M tokens","columns":["Input","Cached 
input","Output"],"rows":[{"label":"Standard","values":[0.15,null,0.6]}]}]},"model_type":"chat","license":"proprietary","open_weight":false,"deprecation_date":"2026-06-01","successor":"gemini-3.1-flash-lite"},{"id":"gemini-2.0-flash-lite-preview-02-05","name":"gemini-2.0-flash-lite-preview-02-05","created_by":"google","source":"official","last_updated":"2026-03-23","family":"gemini-2.0","status":"deprecated","deprecation_date":"2025-12-09","successor":"gemini-2.5-flash-lite","capabilities":{"streaming":true,"vision":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":0.25,"output":0.15,"tiers":[{"label":"Text tokens","unit":"Per 1M tokens","columns":["Input","Cached input","Output"],"rows":[{"label":"Standard","values":[0.15,null,0.6]}]}]},"model_type":"chat","license":"proprietary","open_weight":false},{"id":"gemini-2.0-flash-lite-preview","name":"gemini-2.0-flash-lite-preview","created_by":"google","source":"official","last_updated":"2026-03-23","family":"gemini-2.0","status":"deprecated","deprecation_date":"2025-12-09","successor":"gemini-2.5-flash-lite","capabilities":{"streaming":true,"vision":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":0.25,"output":0.15,"tiers":[{"label":"Text tokens","unit":"Per 1M tokens","columns":["Input","Cached 
input","Output"],"rows":[{"label":"Standard","values":[0.15,null,0.6]}]}]},"model_type":"chat","license":"proprietary","open_weight":false},{"id":"gemini-2.0-flash-lite","name":"gemini-2.0-flash-lite","created_by":"google","source":"official","last_updated":"2026-06-02","family":"gemini-2.0","status":"deprecated","knowledge_cutoff":"2024-08","context_window":1048576,"max_output_tokens":8192,"capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text","image","video","audio"],"output":["text","image","audio"]},"pricing":{"input":0.25,"output":0.075,"tiers":[{"label":"Text tokens","unit":"Per 1M tokens","columns":["Input","Cached input","Output"],"rows":[{"label":"Standard","values":[0.075,null,0.3]}]}]},"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"model_type":"chat","license":"proprietary","open_weight":false,"deprecation_date":"2026-06-01","successor":"gemini-3.1-flash-lite"},{"id":"gemini-2.0-flash-live-001","name":"gemini-2.0-flash-live-001","created_by":"google","source":"official","last_updated":"2026-03-27","family":"gemini-2.0","status":"deprecated","deprecation_date":"2025-12-09","successor":"gemini-3.1-flash-live-preview","capabilities":{"streaming":true,"vision":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":0.25,"output":0.15,"tiers":[{"label":"Text tokens","unit":"Per 1M tokens","columns":["Input","Cached 
input","Output"],"rows":[{"label":"Standard","values":[0.15,null,0.6]}]}]},"model_type":"chat","license":"proprietary","open_weight":false},{"id":"gemini-2.0-flash-preview-image-generation","name":"gemini-2.0-flash-preview-image-generation","created_by":"google","source":"official","last_updated":"2026-03-23","family":"gemini-2.0","status":"deprecated","deprecation_date":"2025-11-14","successor":"gemini-2.5-flash-image","capabilities":{"streaming":true,"vision":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":0.25,"output":0.15,"tiers":[{"label":"Text tokens","unit":"Per 1M tokens","columns":["Input","Cached input","Output"],"rows":[{"label":"Standard","values":[0.15,null,0.6]}]}]},"model_type":"chat","license":"proprietary","open_weight":false},{"id":"gemini-2.0-flash","name":"gemini-2.0-flash","created_by":"google","source":"official","last_updated":"2026-06-02","family":"gemini-2.0","status":"deprecated","knowledge_cutoff":"2024-08","context_window":1048576,"max_output_tokens":8192,"capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text","image","video","audio"],"output":["text","image","audio"]},"pricing":{"input":0.25,"output":0.15,"tiers":[{"label":"Text tokens","unit":"Per 1M tokens","columns":["Input","Cached 
input","Output"],"rows":[{"label":"Standard","values":[0.15,null,0.6]}]}]},"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"model_type":"chat","license":"proprietary","open_weight":false,"deprecation_date":"2026-06-01","successor":"gemini-3.5-flash"},{"id":"gemini-2.5-computer-use-preview-10-2025","name":"gemini-2.5-computer-use-preview-10-2025","created_by":"google","source":"official","last_updated":"2026-04-22","family":"gemini-2.5","status":"active","context_window":128000,"max_output_tokens":64000,"capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text","image"],"output":["text"]},"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"model_type":"chat","license":"proprietary","open_weight":false},{"id":"gemini-2.5-flash-image-preview","name":"gemini-2.5-flash-image-preview","created_by":"google","source":"official","last_updated":"2026-03-23","family":"gemini-2.5","status":"deprecated","deprecation_date":"2026-01-15","successor":"gemini-2.5-flash-image","capabilities":{"streaming":true,"vision":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":0.3,"output":2.5,"batch_input":0.15,"batch_output":1.25,"tiers":[{"label":"Text tokens","unit":"Per 1M tokens","columns":["Input","Cached 
input","Output"],"rows":[{"label":"Standard","values":[0.3,null,2.5]},{"label":"Priority","values":[0.54,null,4.5]},{"label":"Flex","values":[0.15,null,1.25]}]}]},"model_type":"chat","license":"proprietary","open_weight":false},{"id":"gemini-2.5-flash-image","name":"gemini-2.5-flash-image","created_by":"google","source":"official","last_updated":"2026-06-29","family":"gemini-2.5","status":"active","knowledge_cutoff":"2025-06","context_window":65536,"max_output_tokens":32768,"capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text","image","audio"],"output":["text","image","audio"]},"pricing":{"input":0.3,"output":2.5,"batch_input":0.15,"batch_output":1.25,"tiers":[{"label":"Text tokens","unit":"Per 1M tokens","columns":["Input","Cached input","Output"],"rows":[{"label":"Standard","values":[0.3,null,2.5]},{"label":"Priority","values":[null,null,null]},{"label":"Flex","values":[0.15,null,1.25]}]}]},"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"model_type":"chat","license":"proprietary","open_weight":false,"description":"The Interactions API is now generally available. We recommend using this API for access to all the latest features and models. Home Gemini API Docs Send feedback Gemini 2.5 Flash Image (Nano Banana) Our best engine for high-velocity visual creation, offering state-of-the-art speed and efficiency. 
Gemini 2.5 Flash Image, also known as Nano Banana, is best for high-volume generation, conversational image editing, and low-latency creative workflows that require native multimodal understanding.","tagline":"Our best engine for high-velocity visual creation, offering state-of-the-art speed and efficiency."},{"id":"gemini-2.5-flash-lite-preview-09-2025","name":"gemini-2.5-flash-lite-preview-09-2025","created_by":"google","source":"official","last_updated":"2026-05-10","family":"gemini-2.5","status":"deprecated","knowledge_cutoff":"2025-01","context_window":1048576,"max_output_tokens":65536,"capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text","image","video","audio"],"output":["text","image","audio"]},"pricing":{"input":0.3,"output":2.5,"batch_input":0.15,"batch_output":1.25,"tiers":[{"label":"Text tokens","unit":"Per 1M tokens","columns":["Input","Cached input","Output"],"rows":[{"label":"Standard","values":[0.3,null,2.5]},{"label":"Priority","values":[0.54,null,4.5]},{"label":"Flex","values":[0.15,null,1.25]}]}]},"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"model_type":"chat","license":"proprietary","open_weight":false,"deprecation_date":"2026-03-31","successor":"gemini-3.1-flash-lite"},{"id":"gemini-2.5-flash-lite","name":"gemini-2.5-flash-lite","created_by":"google","source":"official","last_updated":"2026-06-29","family":"gemini-2.5","status":"active","knowledge_cutoff":"2025-01","context_window":1048576,"max_output_tokens":65536,"capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text","image","video","audio"],"output":["text","image","audio"]},"pricing":{"input":0.1,"output":0.4,"batch_input":0.05,"batch_output":0.2,"tiers":[{"label":"Text tokens","unit":"Per 1M tokens","columns":["Input","Cached 
input","Output"],"rows":[{"label":"Standard","values":[0.1,null,0.4]},{"label":"Priority","values":[0.18,null,0.72]},{"label":"Flex","values":[0.05,null,0.2]}]}]},"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"model_type":"chat","license":"proprietary","open_weight":false,"description":"The Interactions API is now generally available. We recommend using this API for access to all the latest features and models. Home Gemini API Docs Send feedback Gemini 2.5 Flash-Lite Our most cost-efficient multimodal model, offering the fastest performance for high-frequency, lightweight tasks. Gemini 2.5 Flash-Lite is best for high-volume classification, simple data extraction, and extremely low-latency applications where budget and speed are the primary constraints.","tagline":"Our most cost-efficient multimodal model, offering the fastest performance for high-frequency, lightweight tasks."},{"id":"gemini-2.5-flash-native-audio-preview-12-2025","name":"gemini-2.5-flash-native-audio-preview-12-2025","created_by":"google","source":"official","last_updated":"2026-06-29","family":"gemini-2.5","status":"active","knowledge_cutoff":"2025-01","context_window":131072,"max_output_tokens":8192,"capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text","image","video","audio"],"output":["text","image","audio"]},"pricing":{"input":0.3,"output":2.5,"batch_input":0.15,"batch_output":1.25,"tiers":[{"label":"Text tokens","unit":"Per 1M tokens","columns":["Input","Cached input","Output"],"rows":[{"label":"Standard","values":[0.3,null,2.5]},{"label":"Priority","values":[0.54,null,4.5]},{"label":"Flex","values":[0.15,null,1.25]}]}]},"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"model_type":"chat","license":"proprietary","open_weight":false,"description":"The Interactions API is now generally available. 
We recommend using this API for access to all the latest features and models. Home Gemini API Docs Send feedback Gemini 2.5 Flash Live Preview The Live API enables low-latency, real-time voice and video interactions with Gemini 2.5 Flash. It processes continuous streams of audio, video, or text to deliver immediate, human-like spoken responses, creating a natural conversational experience for your users.","tagline":"The Live API enables low-latency, real-time voice and video interactions with Gemini 2.5 Flash."},{"id":"gemini-2.5-flash-preview-05-20","name":"gemini-2.5-flash-preview-05-20","created_by":"google","source":"official","last_updated":"2026-05-23","family":"gemini-2.5","status":"deprecated","deprecation_date":"2025-11-18","successor":"gemini-3.5-flash","capabilities":{"streaming":true,"vision":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":0.3,"output":2.5,"batch_input":0.15,"batch_output":1.25,"tiers":[{"label":"Text tokens","unit":"Per 1M tokens","columns":["Input","Cached input","Output"],"rows":[{"label":"Standard","values":[0.3,null,2.5]},{"label":"Priority","values":[0.54,null,4.5]},{"label":"Flex","values":[0.15,null,1.25]}]}]},"model_type":"chat","license":"proprietary","open_weight":false},{"id":"gemini-2.5-flash-preview-09-2025","name":"gemini-2.5-flash-preview-09-2025","created_by":"google","source":"official","last_updated":"2026-03-24","family":"gemini-2.5","status":"active","knowledge_cutoff":"2025-01","context_window":1048576,"max_output_tokens":65536,"capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text","image","video","audio"],"output":["text","image","audio"]},"pricing":{"input":0.3,"output":2.5,"batch_input":0.15,"batch_output":1.25,"tiers":[{"label":"Text tokens","unit":"Per 1M tokens","columns":["Input","Cached 
input","Output"],"rows":[{"label":"Standard","values":[0.3,null,2.5]},{"label":"Priority","values":[0.54,null,4.5]},{"label":"Flex","values":[0.15,null,1.25]}]}]},"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"model_type":"chat","license":"proprietary","open_weight":false},{"id":"gemini-2.5-flash-preview-09-25","name":"gemini-2.5-flash-preview-09-25","created_by":"google","source":"official","last_updated":"2026-05-23","family":"gemini-2.5","status":"deprecated","deprecation_date":"2026-02-17","successor":"gemini-3.5-flash","capabilities":{"streaming":true,"vision":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":0.3,"output":2.5,"batch_input":0.15,"batch_output":1.25,"tiers":[{"label":"Text tokens","unit":"Per 1M tokens","columns":["Input","Cached input","Output"],"rows":[{"label":"Standard","values":[0.3,null,2.5]},{"label":"Priority","values":[0.54,null,4.5]},{"label":"Flex","values":[0.15,null,1.25]}]}]},"model_type":"chat","license":"proprietary","open_weight":false},{"id":"gemini-2.5-flash-preview-tts","name":"gemini-2.5-flash-preview-tts","created_by":"google","source":"official","last_updated":"2026-06-29","family":"gemini-2.5","status":"active","context_window":8192,"max_output_tokens":16384,"model_type":"tts","capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text","image","audio"],"output":["text","image","audio"]},"pricing":{"input":0.3,"output":2.5,"batch_input":0.15,"batch_output":1.25,"tiers":[{"label":"Text tokens","unit":"Per 1M tokens","columns":["Input","Cached input","Output"],"rows":[{"label":"Standard","values":[0.3,null,2.5]},{"label":"Priority","values":[0.54,null,4.5]},{"label":"Flex","values":[0.15,null,1.25]}]}]},"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"license":"proprietary","open_weight":false,"description":"The 
Interactions API is now generally available. We recommend using this API for access to all the latest features and models. Home Gemini API Docs Send feedback Gemini 2.5 Flash Text-to-Speech Our fastest engine for high-fidelity speech synthesis, offering low-latency and cost-efficient audio generation. Gemini 2.5 Flash TTS is best for real-time assistants, high-volume narration, and conversational use cases that require fine-grained control over voice style and pacing.","tagline":"Our fastest engine for high-fidelity speech synthesis, offering low-latency and cost-efficient audio generation."},{"id":"gemini-2.5-flash","name":"gemini-2.5-flash","created_by":"google","source":"official","last_updated":"2026-06-29","family":"gemini-2.5","status":"active","knowledge_cutoff":"2025-01","context_window":1048576,"max_output_tokens":65536,"capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text","image","video","audio"],"output":["text","image","audio"]},"pricing":{"input":0.3,"output":2.5,"batch_input":0.15,"batch_output":1.25,"tiers":[{"label":"Text tokens","unit":"Per 1M tokens","columns":["Input","Cached input","Output"],"rows":[{"label":"Standard","values":[0.3,null,2.5]},{"label":"Priority","values":[0.54,null,4.5]},{"label":"Flex","values":[0.15,null,1.25]}]}]},"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"model_type":"chat","license":"proprietary","open_weight":false,"description":"The Interactions API is now generally available. We recommend using this API for access to all the latest features and models. Home Gemini API Docs Send feedback Gemini 2.5 Flash Our best model in terms of price-performance, offering well-rounded capabilities. 
2.5 Flash is best for large scale processing, low-latency, high volume tasks that require thinking, and agentic use cases.","tagline":"Our best model in terms of price-performance, offering well-rounded capabilities."},{"id":"gemini-2.5-pro-preview-03-25","name":"gemini-2.5-pro-preview-03-25","created_by":"google","source":"official","last_updated":"2026-03-23","family":"gemini-2.5","status":"deprecated","deprecation_date":"2025-12-02","successor":"gemini-3.1-pro-preview","capabilities":{"streaming":true,"vision":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":1.25,"output":10,"batch_input":0.625,"batch_output":5,"tiers":[{"label":"Text tokens","unit":"Per 1M tokens","columns":["Input","Cached input","Output"],"rows":[{"label":"Standard","values":[1.25,null,10]},{"label":"Priority","values":[2.25,null,18]},{"label":"Flex","values":[0.625,null,5]}]}]},"model_type":"chat","license":"proprietary","open_weight":false},{"id":"gemini-2.5-pro-preview-05-06","name":"gemini-2.5-pro-preview-05-06","created_by":"google","source":"official","last_updated":"2026-03-23","family":"gemini-2.5","status":"deprecated","deprecation_date":"2025-12-02","successor":"gemini-3.1-pro-preview","capabilities":{"streaming":true,"vision":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":1.25,"output":10,"batch_input":0.625,"batch_output":5,"tiers":[{"label":"Text tokens","unit":"Per 1M tokens","columns":["Input","Cached 
input","Output"],"rows":[{"label":"Standard","values":[1.25,null,10]},{"label":"Priority","values":[2.25,null,18]},{"label":"Flex","values":[0.625,null,5]}]}]},"model_type":"chat","license":"proprietary","open_weight":false},{"id":"gemini-2.5-pro-preview-06-05","name":"gemini-2.5-pro-preview-06-05","created_by":"google","source":"official","last_updated":"2026-03-23","family":"gemini-2.5","status":"deprecated","deprecation_date":"2025-12-02","successor":"gemini-3.1-pro-preview","capabilities":{"streaming":true,"vision":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":1.25,"output":10,"batch_input":0.625,"batch_output":5,"tiers":[{"label":"Text tokens","unit":"Per 1M tokens","columns":["Input","Cached input","Output"],"rows":[{"label":"Standard","values":[1.25,null,10]},{"label":"Priority","values":[2.25,null,18]},{"label":"Flex","values":[0.625,null,5]}]}]},"model_type":"chat","license":"proprietary","open_weight":false},{"id":"gemini-2.5-pro-preview-tts","name":"gemini-2.5-pro-preview-tts","created_by":"google","source":"official","last_updated":"2026-06-29","family":"gemini-2.5","status":"active","context_window":8192,"max_output_tokens":16384,"model_type":"tts","capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text","image","audio"],"output":["text","image","audio"]},"pricing":{"input":1.25,"output":10,"batch_input":0.625,"batch_output":5,"tiers":[{"label":"Text tokens","unit":"Per 1M tokens","columns":["Input","Cached input","Output"],"rows":[{"label":"Standard","values":[1.25,null,10]},{"label":"Priority","values":[2.25,null,18]},{"label":"Flex","values":[0.625,null,5]}]}]},"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"license":"proprietary","open_weight":false,"description":"The Interactions API is now generally available. 
We recommend using this API for access to all the latest features and models. Home Gemini API Docs Send feedback Gemini 2.5 Pro Text-to-Speech Our premium engine for studio-quality speech synthesis, offering high-fidelity and sophisticated audio generation. Gemini 2.5 Pro TTS is best for long-form content, professional narrations, and complex creative workflows that require the highest level of vocal clarity and natural prosody.","tagline":"Our premium engine for studio-quality speech synthesis, offering high-fidelity and sophisticated audio generation."},{"id":"gemini-2.5-pro","name":"gemini-2.5-pro","created_by":"google","source":"official","last_updated":"2026-06-29","family":"gemini-2.5","status":"active","knowledge_cutoff":"2025-01","context_window":1048576,"max_output_tokens":65536,"capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text","image","video","audio"],"output":["text","image","audio"]},"pricing":{"input":1.25,"output":10,"batch_input":0.625,"batch_output":5,"tiers":[{"label":"Text tokens","unit":"Per 1M tokens","columns":["Input","Cached input","Output"],"rows":[{"label":"Standard","values":[1.25,null,10]},{"label":"Priority","values":[2.25,null,18]},{"label":"Flex","values":[0.625,null,5]}]}]},"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"model_type":"chat","license":"proprietary","open_weight":false,"description":"The Interactions API is now generally available. We recommend using this API for access to all the latest features and models. 
Home Gemini API Docs Send feedback Gemini 2.5 Pro Our state-of-the-art thinking model, capable of reasoning over complex problems in code, math, and STEM, as well as analyzing large datasets, codebases, and documents using long context.","tagline":"Our state-of-the-art thinking model, capable of reasoning over complex problems in code, math, and STEM, as well as analyzing large datasets, codebases, and documents using long context."},{"id":"gemini-3-flash-preview","name":"gemini-3-flash-preview","created_by":"google","source":"official","last_updated":"2026-06-29","family":"gemini-3","status":"active","knowledge_cutoff":"2025-01","context_window":1048576,"max_output_tokens":65536,"capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text","image","video","audio"],"output":["text","image","audio"]},"pricing":{"input":0.5,"output":3,"batch_input":0.25,"batch_output":1.5,"tiers":[{"label":"Text tokens","unit":"Per 1M tokens","columns":["Input","Cached input","Output"],"rows":[{"label":"Standard","values":[0.5,null,3]},{"label":"Priority","values":[0.9,null,5.4]},{"label":"Flex","values":[0.25,null,1.5]}]}]},"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"model_type":"chat","license":"proprietary","open_weight":false,"description":"The Interactions API is now generally available. We recommend using this API for access to all the latest features and models. 
Home Gemini API Docs Send feedback Gemini 3 Flash Preview The best model in the world for multimodal understanding, and our most powerful agentic and vibe-coding model yet, delivering richer visuals and deeper interactivity, all built on a foundation of state-of-the-art reasoning.","tagline":"The best model in the world for multimodal understanding, and our most powerful agentic and vibe-coding model yet, delivering richer visuals and deeper interactivity, all built on a foundation of stat"},{"id":"gemini-3-pro-image-preview","name":"gemini-3-pro-image-preview","created_by":"google","source":"official","last_updated":"2026-06-29","family":"gemini-3","status":"deprecated","knowledge_cutoff":"2025-01","context_window":65536,"max_output_tokens":32768,"capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":2,"output":12,"batch_input":1,"batch_output":6,"tiers":[{"label":"Text tokens","unit":"Per 1M tokens","columns":["Input","Cached 
input","Output"],"rows":[{"label":"Standard","values":[2,null,12]},{"label":"Priority","values":[null,null,null]},{"label":"Flex","values":[1,null,6]}]}]},"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"model_type":"chat","license":"proprietary","open_weight":false,"deprecation_date":"2026-06-25","successor":"gemini-3-pro-image"},{"id":"gemini-3-pro-image","name":"gemini-3-pro-image","created_by":"google","source":"official","family":"gemini-3","status":"active","knowledge_cutoff":"2025-01","context_window":65536,"max_output_tokens":32768,"model_type":"chat","license":"proprietary","open_weight":false,"capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text","image","audio"],"output":["text","image","audio"]},"pricing":{"input":2,"output":12,"batch_input":1,"batch_output":6,"tiers":[{"label":"Text tokens","unit":"Per 1M tokens","columns":["Input","Cached input","Output"],"rows":[{"label":"Standard","values":[2,null,12]},{"label":"Priority","values":[null,null,null]},{"label":"Flex","values":[1,null,6]}]}]},"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"last_updated":"2026-06-29","description":"The Interactions API is now generally available. We recommend using this API for access to all the latest features and models. Home Gemini API Docs Send feedback Gemini 3 Pro Image Nano Banana Pro is a sophisticated reasoning-driven engine for professional-grade image editing and generation, offering studio-quality precision and advanced creative control. 
Nano Banana Pro is best for complex graphic design, high-fidelity product mockups, and factual data visualizations that require accurate text rendering and real-world grounding via Google Search.","tagline":"The Interactions API is now generally available."},{"id":"gemini-3-pro-preview","name":"gemini-3-pro-preview","created_by":"google","source":"official","last_updated":"2026-03-24","family":"gemini-3","status":"deprecated","deprecation_date":"2026-03-09","knowledge_cutoff":"2025-01","context_window":1048576,"max_output_tokens":65536,"successor":"gemini-3.1-pro-preview","capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text","image","video","audio"],"output":["text","image","audio"]},"pricing":{"input":2,"output":12,"batch_input":1,"batch_output":6,"tiers":[{"label":"Text tokens","unit":"Per 1M tokens","columns":["Input","Cached input","Output"],"rows":[{"label":"Standard","values":[2,null,12]},{"label":"Priority","values":[3.6,null,21.6]},{"label":"Flex","values":[1,null,6]}]}]},"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"model_type":"chat","license":"proprietary","open_weight":false},{"id":"gemini-3.1-flash-image-preview","name":"gemini-3.1-flash-image-preview","created_by":"google","source":"official","last_updated":"2026-06-29","family":"gemini-3.1","status":"deprecated","knowledge_cutoff":"2025-01","context_window":131072,"max_output_tokens":32768,"capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":0.5,"output":3,"batch_input":0.25,"batch_output":1.5,"tiers":[{"label":"Text tokens","unit":"Per 1M tokens","columns":["Input","Cached 
input","Output"],"rows":[{"label":"Standard","values":[0.5,null,3]},{"label":"Priority","values":[null,null,null]},{"label":"Flex","values":[0.25,null,1.5]}]}]},"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"model_type":"chat","license":"proprietary","open_weight":false,"deprecation_date":"2026-06-25","successor":"gemini-3.1-flash-image"},{"id":"gemini-3.1-flash-image","name":"gemini-3.1-flash-image","created_by":"google","source":"official","family":"gemini-3.1","status":"active","knowledge_cutoff":"2025-01","context_window":131072,"max_output_tokens":32768,"model_type":"chat","license":"proprietary","open_weight":false,"capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text","image","audio"],"output":["text","image","audio"]},"pricing":{"input":0.5,"output":3,"batch_input":0.25,"batch_output":1.5,"tiers":[{"label":"Text tokens","unit":"Per 1M tokens","columns":["Input","Cached input","Output"],"rows":[{"label":"Standard","values":[0.5,null,3]},{"label":"Priority","values":[null,null,null]},{"label":"Flex","values":[0.25,null,1.5]}]}]},"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"last_updated":"2026-06-29","description":"The Interactions API is now generally available. We recommend using this API for access to all the latest features and models. Home Gemini API Docs Send feedback Gemini 3.1 Flash Image Nano Banana 2 provides high-quality image generation and conversational editing at a mainstream price point and low latency. It serves as the high-efficiency counterpart to Gemini 3 Pro Image , optimized for speed and high-volume developer use cases. 
Key updates: New output resolution options: New support for 0.5K, 2K and 4K, default 1K New Image Search Grounding: Integration of both text and image search results to inform generation with real-time web data Supported with Thinking on or off New 1:4, 4:1, 1:8 and 8:1 aspect ratios Improved aspect ratio adherence Improved image quality and consistency Improved i18n text rendering","tagline":"The Interactions API is now generally available."},{"id":"gemini-3.1-flash-lite-preview","name":"gemini-3.1-flash-lite-preview","created_by":"google","source":"official","last_updated":"2026-05-29","family":"gemini-3.1","status":"deprecated","knowledge_cutoff":"2025-01","context_window":1048576,"max_output_tokens":65536,"capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text","image","video","audio"],"output":["text","image","audio"]},"pricing":{"input":0.25,"output":1.5,"batch_input":0.125,"batch_output":0.75,"tiers":[{"label":"Text tokens","unit":"Per 1M tokens","columns":["Input","Cached input","Output"],"rows":[{"label":"Standard","values":[0.25,null,1.5]},{"label":"Priority","values":[0.45,null,2.7]},{"label":"Flex","values":[0.125,null,0.75]}]}]},"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"model_type":"chat","license":"proprietary","open_weight":false,"description":"Our most cost-efficient multimodal model, offering the fastest performance for high-frequency, lightweight tasks. 
Gemini 3.1 Flash-Lite is best for high-volume agentic tasks, simple data extraction, and extremely low-latency applications where budget and speed are the primary constraints.","tagline":"Our most cost-efficient multimodal model, offering the fastest performance for high-frequency, lightweight tasks.","deprecation_date":"2026-05-25","successor":"gemini-3.1-flash-lite"},{"id":"gemini-3.1-flash-lite","name":"gemini-3.1-flash-lite","created_by":"google","source":"official","family":"gemini-3.1","description":"The Interactions API is now generally available. We recommend using this API for access to all the latest features and models. Home Gemini API Docs Send feedback Gemini 3.1 Flash-Lite Gemini 3.1 Flash-Lite is a low-latency, cost-effective multimodal model optimized for high-frequency, lightweight tasks. The model supports text, image, video, audio, and PDF inputs, and is designed for high-volume agentic workflows, simple data extraction, and applications where latency and API cost are the primary constraints.","status":"active","knowledge_cutoff":"2025-01","context_window":1048576,"max_output_tokens":65536,"model_type":"chat","license":"proprietary","tagline":"The model supports text, image, video, audio, and PDF inputs, and is designed for high-volume agentic workflows, simple data extraction, and applications where latency and API cost are the primary con","open_weight":false,"capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text","image","video","audio"],"output":["text","image","audio"]},"pricing":{"input":0.25,"output":1.5,"batch_input":0.125,"batch_output":0.75,"tiers":[{"label":"Text tokens","unit":"Per 1M tokens","columns":["Input","Cached 
input","Output"],"rows":[{"label":"Standard","values":[0.25,null,1.5]},{"label":"Priority","values":[0.45,null,2.7]},{"label":"Flex","values":[0.125,null,0.75]}]}]},"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"last_updated":"2026-06-29"},{"id":"gemini-3.1-flash-live-preview","name":"gemini-3.1-flash-live-preview","created_by":"google","source":"official","family":"gemini-3.1","status":"active","knowledge_cutoff":"2025-01","context_window":131072,"max_output_tokens":65536,"model_type":"chat","license":"proprietary","open_weight":false,"capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text","image","video","audio"],"output":["text","image","audio"]},"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"last_updated":"2026-06-29","description":"The Interactions API is now generally available. We recommend using this API for access to all the latest features and models. Home Gemini API Docs Send feedback Gemini 3.1 Flash Live Preview Gemini 3.1 Flash Live Preview is our low-latency, audio-to-audio model optimized for real-time dialogue and voice-first AI applications with acoustic nuance detection, numeric precision, and multimodal awareness.","tagline":"The Interactions API is now generally available."},{"id":"gemini-3.1-flash-tts-preview","name":"gemini-3.1-flash-tts-preview","created_by":"google","source":"official","family":"gemini-3.1","description":"The Interactions API is now generally available. We recommend using this API for access to all the latest features and models. 
Home Gemini API Docs Send feedback Gemini 3.1 Flash TTS (Text-to-Speech) Preview The Gemini 3.1 Flash TTS Preview model provides powerful, low-latency speech generation with natural outputs, steerable prompts, and new expressive audio tags for precise narration control.","status":"active","knowledge_cutoff":"2025-01","context_window":8192,"max_output_tokens":16384,"model_type":"tts","license":"proprietary","tagline":"The Gemini 3.1 Flash TTS Preview model provides powerful, low-latency speech generation with natural outputs, steerable prompts, and new expressive audio tags for precise narration control.","open_weight":false,"capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text","image","audio"],"output":["text","image","audio"]},"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"last_updated":"2026-06-29"},{"id":"gemini-3.1-pro-preview","name":"gemini-3.1-pro-preview","created_by":"google","source":"official","last_updated":"2026-06-29","family":"gemini-3.1","status":"active","knowledge_cutoff":"2025-01","context_window":1048576,"max_output_tokens":65536,"capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text","image","video","audio"],"output":["text","image","audio"]},"pricing":{"input":2,"output":12,"batch_input":1,"batch_output":6,"tiers":[{"label":"Text tokens","unit":"Per 1M tokens","columns":["Input","Cached input","Output"],"rows":[{"label":"Standard","values":[2,null,12]},{"label":"Priority","values":[3.6,null,21.6]},{"label":"Flex","values":[1,null,6]}]}]},"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"model_type":"chat","license":"proprietary","open_weight":false,"description":"The Interactions API is now generally available. 
We recommend using this API for access to all the latest features and models. Home Gemini API Docs Send feedback Gemini 3.1 Pro Preview Built to refine the performance and reliability of the Gemini 3 Pro series, Gemini 3.1 Pro Preview provides better thinking, improved token efficiency, and a more grounded, factually consistent experience. It's optimized for software engineering behavior and usability, as well as agentic workflows requiring precise tool usage and reliable multi-step execution across real-world domains.","tagline":"The Interactions API is now generally available."},{"id":"gemini-3.5-flash","name":"gemini-3.5-flash","created_by":"google","source":"official","family":"gemini-3.5","status":"active","knowledge_cutoff":"2025-01","context_window":1048576,"max_output_tokens":65536,"model_type":"chat","license":"proprietary","open_weight":false,"capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text","image","video","audio"],"output":["text","image","audio"]},"pricing":{"input":1.5,"output":9,"batch_input":0.75,"batch_output":4.5,"tiers":[{"label":"Text tokens","unit":"Per 1M tokens","columns":["Input","Cached input","Output"],"rows":[{"label":"Standard","values":[1.5,null,9]},{"label":"Priority","values":[2.7,null,16.2]},{"label":"Flex","values":[0.75,null,4.5]}]}]},"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"last_updated":"2026-06-29","description":"The Interactions API is now generally available. We recommend using this API for access to all the latest features and models. Home Gemini API Docs Send feedback Gemini 3.5 Flash Gemini 3.5 Flash provides sustained frontier-level intelligence optimized for real-world tasks at a higher speed and lower cost. Designed for the agentic era, it excels at sub-agent deployment, multi-step workflows, and long-horizon tasks at scale. 
This model is particularly effective for rapid agentic loops involving complex coding cycles and iterations.","tagline":"The Interactions API is now generally available."},{"id":"gemini-3.5-live-translate-preview","name":"gemini-3.5-live-translate-preview","created_by":"google","source":"official","family":"gemini-3.5","status":"active","knowledge_cutoff":"2025-01","context_window":131072,"max_output_tokens":65536,"model_type":"translation","license":"proprietary","open_weight":false,"capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text","image","audio"],"output":["text","image","audio"]},"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"last_updated":"2026-06-29","description":"The Interactions API is now generally available. We recommend using this API for access to all the latest features and models. Home Gemini API Docs Send feedback Gemini 3.5 Live Translate Gemini 3.5 Live Translate is our low-latency, audio-to-audio model optimized for real-time translation of spoken conversations. 
It enables seamless, bidirectional translation with high accuracy and natural voice output.","tagline":"The Interactions API is now generally available."},{"id":"gemini-embedding-001","name":"gemini-embedding-001","created_by":"google","source":"official","last_updated":"2026-03-27","status":"active","context_window":2048,"model_type":"embed","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["generateContent","streamGenerateContent"],"family":"gemini-embedding","license":"proprietary","open_weight":false},{"id":"gemini-embedding-2-preview","name":"gemini-embedding-2-preview","created_by":"google","source":"official","last_updated":"2026-03-23","status":"active","context_window":8192,"model_type":"embed","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["generateContent","streamGenerateContent"],"family":"gemini-embedding","license":"proprietary","open_weight":false},{"id":"gemini-embedding-2","name":"gemini-embedding-2","created_by":"google","source":"official","family":"gemini-embedding","status":"active","context_window":8192,"model_type":"embed","license":"proprietary","open_weight":false,"capabilities":{"vision":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["generateContent","streamGenerateContent"],"last_updated":"2026-04-24"},{"id":"gemini-embedding-exp-03-07","name":"gemini-embedding-exp-03-07","created_by":"google","source":"official","last_updated":"2026-06-02","status":"deprecated","deprecation_date":"2025-10-30","model_type":"embed","successor":"gemini-embedding-2","modalities":{"input":["text"],"output":["text"]},"family":"gemini-embedding","license":"proprietary","open_weight":false},{"id":"gemini-embedding-exp","name":"gemini-embedding-exp","created_by":"google","source":"official","last_updated":"2026-06-02","status":"deprecated","deprecation_date":"2025-10-30","model_type":"embed","successor":"gemini-embedding-2","modalities":{"input":["text
"],"output":["text"]},"family":"gemini-embedding","license":"proprietary","open_weight":false},{"id":"gemini-live-2.5-flash-preview","name":"gemini-live-2.5-flash-preview","created_by":"google","source":"official","last_updated":"2026-03-27","status":"deprecated","deprecation_date":"2025-12-09","successor":"gemini-3.1-flash-live-preview","capabilities":{"streaming":true,"vision":true},"modalities":{"input":["text","image"],"output":["text"]},"family":"gemini-2.5","model_type":"chat","license":"proprietary","open_weight":false},{"id":"gemini-robotics-er-1.5-preview","name":"gemini-robotics-er-1.5-preview","created_by":"google","source":"official","last_updated":"2026-06-29","status":"deprecated","knowledge_cutoff":"2025-01","context_window":1048576,"max_output_tokens":65536,"capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text","image","video","audio"],"output":["text","image","audio"]},"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"family":"gemini-1.5","model_type":"chat","license":"proprietary","open_weight":false,"deprecation_date":"2026-04-30","successor":"gemini-robotics-er-1.6-preview","description":"The Interactions API is now generally available. We recommend using this API for access to all the latest features and models. Home Gemini API Docs Send feedback Gemini Robotics-ER 1.5 Note: This version is planned for deprecation soon . See the models page for the latest model version. Gemini Robotics-ER 1.5 is a vision-language model (VLM) that brings Gemini's agentic capabilities to robotics. 
It's designed for advanced reasoning in the physical world, allowing robots to interpret complex visual data, perform spatial reasoning, and plan actions from natural language commands.","tagline":"The Interactions API is now generally available."},{"id":"gemini-robotics-er-1.6-preview","name":"gemini-robotics-er-1.6-preview","created_by":"google","source":"official","family":"gemini-1.6","status":"active","knowledge_cutoff":"2025-01","context_window":131072,"max_output_tokens":65536,"model_type":"chat","license":"proprietary","open_weight":false,"capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text","image","video","audio"],"output":["text","image","audio"]},"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"last_updated":"2026-06-29","description":"The Interactions API is now generally available. We recommend using this API for access to all the latest features and models. Home Gemini API Docs Send feedback Gemini Robotics-ER 1.6 Gemini Robotics-ER 1.6 is a vision-language model (VLM) that brings Gemini's agentic capabilities to robotics. 
It's designed for advanced reasoning in the physical world, allowing robots to interpret complex visual data, perform spatial reasoning, and plan actions from natural language commands.","tagline":"The Interactions API is now generally available."},{"id":"imagen-3.0-generate-002","name":"imagen-3.0-generate-002","created_by":"google","source":"official","last_updated":"2026-03-23","status":"deprecated","deprecation_date":"2025-11-10","model_type":"image","successor":"imagen-4.0-generate-001","modalities":{"input":["text"],"output":["image"]},"family":"imagen-3.0","license":"proprietary","open_weight":false},{"id":"imagen-4.0-fast-generate-001","name":"imagen-4.0-fast-generate-001","created_by":"google","source":"official","last_updated":"2026-03-27","status":"active","model_type":"image","modalities":{"input":["text"],"output":["image"]},"family":"imagen-4.0","license":"proprietary","open_weight":false},{"id":"imagen-4.0-generate-001","name":"imagen-4.0-generate-001","created_by":"google","source":"official","last_updated":"2026-03-27","status":"active","model_type":"image","modalities":{"input":["text"],"output":["image"]},"family":"imagen-4.0","license":"proprietary","open_weight":false},{"id":"imagen-4.0-generate-preview-06-06","name":"imagen-4.0-generate-preview-06-06","created_by":"google","source":"official","last_updated":"2026-03-23","status":"deprecated","deprecation_date":"2026-02-17","model_type":"image","successor":"imagen-4.0-generate-001","modalities":{"input":["text"],"output":["image"]},"family":"imagen-4.0","license":"proprietary","open_weight":false},{"id":"imagen-4.0-ultra-generate-001","name":"imagen-4.0-ultra-generate-001","created_by":"google","source":"official","last_updated":"2026-03-27","status":"active","model_type":"image","modalities":{"input":["text"],"output":["image"]},"family":"imagen-4.0","license":"proprietary","open_weight":false},{"id":"imagen-4.0-ultra-generate-preview-06-06","name":"imagen-4.0-ultra-generate-preview-06-06","cre
ated_by":"google","source":"official","last_updated":"2026-03-23","status":"deprecated","deprecation_date":"2026-02-17","model_type":"image","successor":"imagen-4.0-ultra-generate-001","modalities":{"input":["text"],"output":["image"]},"family":"imagen-4.0","license":"proprietary","open_weight":false},{"id":"imagen","name":"imagen","created_by":"google","source":"official","last_updated":"2026-06-29","status":"active","context_window":480,"model_type":"image","capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text"],"output":["image"]},"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"family":"imagen","license":"proprietary","open_weight":false,"description":"The Interactions API is now generally available. We recommend using this API for access to all the latest features and models. Home Gemini API Docs Send feedback Imagen 4 The Imagen 4 standard, ultra, and fast endpoints are deprecated and will be shut down on **August 17, 2026**; migrate to Gemini 3.1 Flash Image to avoid service interruptions. A high-performance engine for advanced visual synthesis, offering sophisticated creative control and photorealistic output. 
Use Imagen 4 for professional branding, intricate scene composition, and high-fidelity design tasks that require precise text rendering and complex lighting.","tagline":"A high-performance engine for advanced visual synthesis, offering sophisticated creative control and photorealistic output."},{"id":"jamba-1.5-large@vertex","name":"Jamba 1.5 Large","created_by":"ai21","source":"official","last_updated":"2026-03-22","capabilities":{"streaming":true},"modalities":{"input":["text"],"output":["text"]},"model_type":"chat"},{"id":"jamba-1.5-mini@vertex","name":"Jamba 1.5 Mini","created_by":"ai21","source":"official","last_updated":"2026-03-22","capabilities":{"streaming":true},"modalities":{"input":["text"],"output":["text"]},"model_type":"chat"},{"id":"lyria-3-clip-preview","name":"lyria-3-clip-preview","created_by":"google","source":"official","status":"active","context_window":131072,"model_type":"tts","license":"proprietary","open_weight":false,"capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text"],"output":["audio"]},"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"last_updated":"2026-06-29","description":"The Interactions API is now generally available. We recommend using this API for access to all the latest features and models. Home Gemini API Docs Send feedback Lyria 3 Clip Preview Lyria 3 Clip Preview is Google's model optimized for generating short musical clips, loops, and previews. 
It generates 30-second high-quality, 48kHz stereo audio from text prompts or image inputs.","tagline":"The Interactions API is now generally available."},{"id":"lyria-3-pro-preview","name":"lyria-3-pro-preview","created_by":"google","source":"official","status":"active","context_window":131072,"model_type":"tts","license":"proprietary","open_weight":false,"capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text"],"output":["audio"]},"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"last_updated":"2026-06-29","description":"The Interactions API is now generally available. We recommend using this API for access to all the latest features and models. Home Gemini API Docs Send feedback Lyria 3 Pro Preview Lyria 3 Pro Preview is Google's flagship music generation model. It is optimized for generating full-length songs with complex structural coherence, including multiple verses, choruses, and bridges. 
It generates high-quality, 48kHz stereo audio from text prompts or image inputs.","tagline":"The Interactions API is now generally available."},{"id":"lyria-realtime-exp","name":"lyria-realtime-exp","created_by":"google","source":"official","last_updated":"2026-03-24","status":"active","model_type":"tts","capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text"],"output":["audio"]},"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"license":"proprietary","open_weight":false},{"id":"mistral-medium-3@vertex","name":"Mistral Medium 3","created_by":"mistral","source":"official","last_updated":"2026-03-23","family":"mistral-medium","capabilities":{"streaming":true,"tool_call":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.4,"output":2,"tiers":[{"label":"Text tokens","unit":"Per 1M tokens","columns":["Input","Cached input","Output"],"rows":[{"label":"Standard","values":[0.4,null,2]}]}]},"model_type":"chat","tools":["function_calling"]},{"id":"text-embedding-004","name":"text-embedding-004","created_by":"google","source":"official","last_updated":"2026-06-02","status":"deprecated","deprecation_date":"2026-01-14","model_type":"embed","successor":"gemini-embedding-2","modalities":{"input":["text"],"output":["text"]},"family":"text-embedding","license":"proprietary","open_weight":false},{"id":"veo-2.0-generate-001","name":"veo-2.0-generate-001","created_by":"google","source":"official","last_updated":"2026-06-29","status":"active","model_type":"video","capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text","image"],"output":["video"]},"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"family":"veo-2.0","license":"proprietary","open_weight":false,"description":"T
he Interactions API is now generally available. We recommend using this API for access to all the latest features and models. Home Gemini API Docs Send feedback Veo 2.0 This model is deprecated and will be shut down on **June 30, 2026**; migrate to Veo 3.1 Preview or the GA models available through the Gemini Enterprise Agent Platform to avoid service interruptions. Our robust and reliable stable video generation model, providing consistent performance for production-ready workflows. Veo 2.0 is best for standard 1080p content creation, social media assets, and high-volume video tasks that prioritize reliable character consistency and predictable sub-second generation speeds.","tagline":"Our robust and reliable stable video generation model, providing consistent performance for production-ready workflows."},{"id":"veo-3.0-fast-generate-001","name":"veo-3.0-fast-generate-001","created_by":"google","source":"official","family":"veo-3.0","status":"active","model_type":"video","license":"proprietary","open_weight":false,"modalities":{"input":["text"],"output":["video"]},"last_updated":"2026-06-18"},{"id":"veo-3.0-fast-generate-preview","name":"veo-3.0-fast-generate-preview","created_by":"google","source":"official","last_updated":"2026-03-23","status":"deprecated","deprecation_date":"2025-11-12","model_type":"video","successor":"veo-3.1-fast-generate-preview","modalities":{"input":["text"],"output":["video"]},"family":"veo-3.0","license":"proprietary","open_weight":false},{"id":"veo-3.0-generate-001","name":"veo-3.0-generate-001","created_by":"google","source":"official","family":"veo-3.0","status":"active","model_type":"video","license":"proprietary","open_weight":false,"modalities":{"input":["text"],"output":["video"]},"last_updated":"2026-06-18"},{"id":"veo-3.0-generate-preview","name":"veo-3.0-generate-preview","created_by":"google","source":"official","last_updated":"2026-03-23","status":"deprecated","deprecation_date":"2025-11-12","model_type":"video","successor":"
veo-3.1-generate-preview","modalities":{"input":["text"],"output":["video"]},"family":"veo-3.0","license":"proprietary","open_weight":false},{"id":"veo-3.1-fast-generate-preview","name":"veo-3.1-fast-generate-preview","created_by":"google","source":"official","family":"veo-3.1","status":"deprecated","deprecation_date":"2025-10-15","model_type":"video","license":"proprietary","open_weight":false,"modalities":{"input":["text"],"output":["video"]},"last_updated":"2026-03-26"},{"id":"veo-3.1-generate-preview","name":"veo-3.1-generate-preview","created_by":"google","source":"official","last_updated":"2026-06-29","status":"active","context_window":1024,"model_type":"video","capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text","image"],"output":["video"]},"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"family":"veo-3.1","license":"proprietary","open_weight":false,"description":"The Interactions API is now generally available. We recommend using this API for access to all the latest features and models. Home Gemini API Docs Send feedback Veo 3.1 A state-of-the-art cinematic engine designed for high-end creative storytelling and experimental video production. 
Veo 3.1 is best for professional-grade 4K output, natively synchronized audio generation, and complex camera movements that require the highest level of temporal consistency and artistic control.","tagline":"A state-of-the-art cinematic engine designed for high-end creative storytelling and experimental video production."},{"id":"veo-3.1-lite-generate-preview","name":"veo-3.1-lite-generate-preview","created_by":"google","source":"official","family":"veo-3.1","status":"active","context_window":1024,"model_type":"video","license":"proprietary","open_weight":false,"capabilities":{"streaming":true,"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["generateContent","streamGenerateContent"],"last_updated":"2026-06-29","description":"The Interactions API is now generally available. We recommend using this API for access to all the latest features and models. Home Gemini API Docs Send feedback Veo 3.1 Lite Preview Veo 3.1 Lite Preview is a high-efficiency, developer-first video model providing high-fidelity video generation, editing, and cinematic control. 
It leverages the state-of-the-art Veo 3.1 model to democratize professional-grade video AI by offering a scalable, programmable interface for creators and enterprises.","tagline":"The Interactions API is now generally available."}]}; +export const provider: ProviderWithModels = {"id":"vertex","name":"Google Vertex AI","region":"US","headquarters":"Mountain View, CA","url":"https://cloud.google.com/vertex-ai","api_url":"https://us-central1-aiplatform.googleapis.com/v1","docs_url":"https://docs.cloud.google.com/vertex-ai/generative-ai/docs/models","pricing_url":"https://cloud.google.com/vertex-ai/generative-ai/pricing","description":"Google Cloud Vertex AI provides enterprise access to Gemini, Claude, Llama, and Mistral models.","type":"cloud","playground_url":"https://console.cloud.google.com/vertex-ai/generative","status_url":"https://status.cloud.google.com","sdk":{"python":"google-cloud-aiplatform","javascript":"@google-cloud/vertexai"},"openai_compatible":true,"free_tier":false,"models_url":"https://cloud.google.com/vertex-ai/generative-ai/docs/learn/models","twitter_url":"https://x.com/GoogleDeepMind","blog_url":"https://cloud.google.com/blog/products/ai-machine-learning","terms_url":"https://cloud.google.com/terms/service-terms","support_url":"https://cloud.google.com/vertex-ai/docs/support/getting-support","icon":"\n \n \n \n \n \n \n \n \n","models":[{"id":"antigravity-preview-05-2026","name":"antigravity-preview-05-2026","created_by":"google","source":"official","status":"active","context_window":1048576,"max_output_tokens":65536,"license":"proprietary","open_weight":false,"capabilities":{"streaming":true,"vision":true},"modalities":{"input":["text","image"],"output":["text"]},"endpoints":["generateContent","streamGenerateContent"],"last_updated":"2026-05-23"},{"id":"claude-haiku-4-5@vertex","name":"Claude Haiku 
4.5","created_by":"anthropic","source":"official","last_updated":"2026-03-23","family":"claude-haiku","context_window":200000,"max_output_tokens":64000,"capabilities":{"streaming":true,"vision":true,"tool_call":true,"reasoning":true,"structured_output":true,"json_mode":true,"batch":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":1.1,"output":5.5,"cached_input":0.11,"batch_input":0.55,"batch_output":2.75,"tiers":[{"label":"Text tokens","unit":"Per 1M tokens","columns":["Input","Cached input","Output"],"rows":[{"label":"Standard","values":[1.1,0.11,5.5]},{"label":"Batch","values":[0.55,null,2.75]}]}]},"model_type":"chat","tools":["function_calling"],"description":"The fastest model with near-frontier intelligence","tagline":"The fastest model with near-frontier intelligence","knowledge_cutoff":"2025-02","training_data_cutoff":"2025-07","license":"proprietary","open_weight":false},{"id":"claude-opus-4-6@vertex","name":"Claude Opus 4.6","created_by":"anthropic","source":"official","last_updated":"2026-03-23","family":"claude-opus","context_window":1000000,"max_output_tokens":128000,"capabilities":{"streaming":true,"vision":true,"tool_call":true,"reasoning":true,"structured_output":true,"json_mode":true,"batch":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":5.5,"output":27.5,"cached_input":0.55,"batch_input":2.75,"batch_output":13.75,"tiers":[{"label":"Text tokens","unit":"Per 1M tokens","columns":["Input","Cached input","Output"],"rows":[{"label":"Standard","values":[5.5,0.55,27.5]},{"label":"Batch","values":[2.75,null,13.75]}]}]},"model_type":"chat","tools":["function_calling"],"description":"The most intelligent broadly available model for agents and coding","tagline":"The most intelligent model for building agents and coding","knowledge_cutoff":"2025-05","training_data_cutoff":"2025-08","license":"proprietary","open_weight":false},{"id":"claude-sonnet-4-6@vertex","name":"Claude Sonnet 
4.6","created_by":"anthropic","source":"official","last_updated":"2026-03-23","family":"claude-sonnet","context_window":1000000,"max_output_tokens":64000,"capabilities":{"streaming":true,"vision":true,"tool_call":true,"reasoning":true,"structured_output":true,"json_mode":true,"batch":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":3.3,"output":16.5,"cached_input":0.33,"batch_input":1.65,"batch_output":8.25,"tiers":[{"label":"Text tokens","unit":"Per 1M tokens","columns":["Input","Cached input","Output"],"rows":[{"label":"Standard","values":[3.3,0.33,16.5]},{"label":"Batch","values":[1.65,null,8.25]}]}]},"model_type":"chat","tools":["function_calling"],"description":"The best combination of speed and intelligence","tagline":"The best combination of speed and intelligence","knowledge_cutoff":"2025-08","training_data_cutoff":"2026-01","license":"proprietary","open_weight":false},{"id":"deep-research-max-preview-04-2026","name":"deep-research-max-preview-04-2026","created_by":"google","source":"official","family":"deep-research","status":"active","context_window":1048576,"max_output_tokens":65536,"model_type":"reasoning","license":"proprietary","open_weight":false,"capabilities":{"streaming":true,"vision":true},"modalities":{"input":["text","image","video","audio"],"output":["text"]},"endpoints":["generateContent","streamGenerateContent"],"last_updated":"2026-04-22"},{"id":"deep-research-preview-04-2026","name":"deep-research-preview-04-2026","created_by":"google","source":"official","family":"deep-research","status":"active","context_window":1048576,"max_output_tokens":65536,"model_type":"reasoning","license":"proprietary","open_weight":false,"capabilities":{"streaming":true,"vision":true},"modalities":{"input":["text","image","video","audio"],"output":["text"]},"endpoints":["generateContent","streamGenerateContent"],"last_updated":"2026-04-22"},{"id":"deep-research-pro-preview-12-2025","name":"deep-research-pro-preview-12-2025","crea
ted_by":"google","source":"official","last_updated":"2026-04-22","status":"active","context_window":1048576,"max_output_tokens":65536,"model_type":"reasoning","capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text","image","video","audio"],"output":["text"]},"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"family":"deep-research","license":"proprietary","open_weight":false},{"id":"embedding-001","name":"embedding-001","created_by":"google","source":"official","last_updated":"2026-06-02","status":"deprecated","deprecation_date":"2025-10-30","model_type":"embed","successor":"gemini-embedding-2","modalities":{"input":["text"],"output":["text"]},"family":"embed","license":"proprietary","open_weight":false},{"id":"embedding-gecko-001","name":"embedding-gecko-001","created_by":"google","source":"official","last_updated":"2026-06-02","status":"deprecated","deprecation_date":"2025-10-30","model_type":"embed","successor":"gemini-embedding-2","modalities":{"input":["text"],"output":["text"]},"family":"embed","license":"proprietary","open_weight":false},{"id":"gemini-2.0-flash-001","name":"gemini-2.0-flash-001","created_by":"google","source":"official","last_updated":"2026-06-02","family":"gemini-2.0","status":"deprecated","capabilities":{"streaming":true,"vision":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":0.25,"output":0.15,"tiers":[{"label":"Text tokens","unit":"Per 1M tokens","columns":["Input","Cached 
input","Output"],"rows":[{"label":"Standard","values":[0.15,null,0.6]}]}]},"model_type":"chat","license":"proprietary","open_weight":false,"deprecation_date":"2026-06-01","successor":"gemini-3.5-flash"},{"id":"gemini-2.0-flash-lite-001","name":"gemini-2.0-flash-lite-001","created_by":"google","source":"official","last_updated":"2026-06-02","family":"gemini-2.0","status":"deprecated","capabilities":{"streaming":true,"vision":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":0.25,"output":0.15,"tiers":[{"label":"Text tokens","unit":"Per 1M tokens","columns":["Input","Cached input","Output"],"rows":[{"label":"Standard","values":[0.15,null,0.6]}]}]},"model_type":"chat","license":"proprietary","open_weight":false,"deprecation_date":"2026-06-01","successor":"gemini-3.1-flash-lite"},{"id":"gemini-2.0-flash-lite-preview-02-05","name":"gemini-2.0-flash-lite-preview-02-05","created_by":"google","source":"official","last_updated":"2026-03-23","family":"gemini-2.0","status":"deprecated","deprecation_date":"2025-12-09","successor":"gemini-2.5-flash-lite","capabilities":{"streaming":true,"vision":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":0.25,"output":0.15,"tiers":[{"label":"Text tokens","unit":"Per 1M tokens","columns":["Input","Cached input","Output"],"rows":[{"label":"Standard","values":[0.15,null,0.6]}]}]},"model_type":"chat","license":"proprietary","open_weight":false},{"id":"gemini-2.0-flash-lite-preview","name":"gemini-2.0-flash-lite-preview","created_by":"google","source":"official","last_updated":"2026-03-23","family":"gemini-2.0","status":"deprecated","deprecation_date":"2025-12-09","successor":"gemini-2.5-flash-lite","capabilities":{"streaming":true,"vision":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":0.25,"output":0.15,"tiers":[{"label":"Text tokens","unit":"Per 1M tokens","columns":["Input","Cached 
input","Output"],"rows":[{"label":"Standard","values":[0.15,null,0.6]}]}]},"model_type":"chat","license":"proprietary","open_weight":false},{"id":"gemini-2.0-flash-lite","name":"gemini-2.0-flash-lite","created_by":"google","source":"official","last_updated":"2026-06-02","family":"gemini-2.0","status":"deprecated","knowledge_cutoff":"2024-08","context_window":1048576,"max_output_tokens":8192,"capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text","image","video","audio"],"output":["text","image","audio"]},"pricing":{"input":0.25,"output":0.075,"tiers":[{"label":"Text tokens","unit":"Per 1M tokens","columns":["Input","Cached input","Output"],"rows":[{"label":"Standard","values":[0.075,null,0.3]}]}]},"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"model_type":"chat","license":"proprietary","open_weight":false,"deprecation_date":"2026-06-01","successor":"gemini-3.1-flash-lite"},{"id":"gemini-2.0-flash-live-001","name":"gemini-2.0-flash-live-001","created_by":"google","source":"official","last_updated":"2026-03-27","family":"gemini-2.0","status":"deprecated","deprecation_date":"2025-12-09","successor":"gemini-3.1-flash-live-preview","capabilities":{"streaming":true,"vision":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":0.25,"output":0.15,"tiers":[{"label":"Text tokens","unit":"Per 1M tokens","columns":["Input","Cached 
input","Output"],"rows":[{"label":"Standard","values":[0.15,null,0.6]}]}]},"model_type":"chat","license":"proprietary","open_weight":false},{"id":"gemini-2.0-flash-preview-image-generation","name":"gemini-2.0-flash-preview-image-generation","created_by":"google","source":"official","last_updated":"2026-03-23","family":"gemini-2.0","status":"deprecated","deprecation_date":"2025-11-14","successor":"gemini-2.5-flash-image","capabilities":{"streaming":true,"vision":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":0.25,"output":0.15,"tiers":[{"label":"Text tokens","unit":"Per 1M tokens","columns":["Input","Cached input","Output"],"rows":[{"label":"Standard","values":[0.15,null,0.6]}]}]},"model_type":"chat","license":"proprietary","open_weight":false},{"id":"gemini-2.0-flash","name":"gemini-2.0-flash","created_by":"google","source":"official","last_updated":"2026-06-02","family":"gemini-2.0","status":"deprecated","knowledge_cutoff":"2024-08","context_window":1048576,"max_output_tokens":8192,"capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text","image","video","audio"],"output":["text","image","audio"]},"pricing":{"input":0.25,"output":0.15,"tiers":[{"label":"Text tokens","unit":"Per 1M tokens","columns":["Input","Cached 
input","Output"],"rows":[{"label":"Standard","values":[0.15,null,0.6]}]}]},"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"model_type":"chat","license":"proprietary","open_weight":false,"deprecation_date":"2026-06-01","successor":"gemini-3.5-flash"},{"id":"gemini-2.5-computer-use-preview-10-2025","name":"gemini-2.5-computer-use-preview-10-2025","created_by":"google","source":"official","last_updated":"2026-04-22","family":"gemini-2.5","status":"active","context_window":128000,"max_output_tokens":64000,"capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text","image"],"output":["text"]},"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"model_type":"chat","license":"proprietary","open_weight":false},{"id":"gemini-2.5-flash-image-preview","name":"gemini-2.5-flash-image-preview","created_by":"google","source":"official","last_updated":"2026-03-23","family":"gemini-2.5","status":"deprecated","deprecation_date":"2026-01-15","successor":"gemini-2.5-flash-image","capabilities":{"streaming":true,"vision":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":0.3,"output":2.5,"batch_input":0.15,"batch_output":1.25,"tiers":[{"label":"Text tokens","unit":"Per 1M tokens","columns":["Input","Cached 
input","Output"],"rows":[{"label":"Standard","values":[0.3,null,2.5]},{"label":"Priority","values":[0.54,null,4.5]},{"label":"Flex","values":[0.15,null,1.25]}]}]},"model_type":"chat","license":"proprietary","open_weight":false},{"id":"gemini-2.5-flash-image","name":"gemini-2.5-flash-image","created_by":"google","source":"official","last_updated":"2026-06-29","family":"gemini-2.5","status":"active","knowledge_cutoff":"2025-06","context_window":65536,"max_output_tokens":32768,"capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text","image","audio"],"output":["text","image","audio"]},"pricing":{"input":0.3,"output":2.5,"batch_input":0.15,"batch_output":1.25,"tiers":[{"label":"Text tokens","unit":"Per 1M tokens","columns":["Input","Cached input","Output"],"rows":[{"label":"Standard","values":[0.3,null,2.5]},{"label":"Priority","values":[null,null,null]},{"label":"Flex","values":[0.15,null,1.25]}]}]},"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"model_type":"chat","license":"proprietary","open_weight":false,"description":"The Interactions API is now generally available. We recommend using this API for access to all the latest features and models. Home Gemini API Docs Send feedback Gemini 2.5 Flash Image (Nano Banana) Our best engine for high-velocity visual creation, offering state-of-the-art speed and efficiency. 
Gemini 2.5 Flash Image, also known as Nano Banana, is best for high-volume generation, conversational image editing, and low-latency creative workflows that require native multimodal understanding.","tagline":"Our best engine for high-velocity visual creation, offering state-of-the-art speed and efficiency."},{"id":"gemini-2.5-flash-lite-preview-09-2025","name":"gemini-2.5-flash-lite-preview-09-2025","created_by":"google","source":"official","last_updated":"2026-05-10","family":"gemini-2.5","status":"deprecated","knowledge_cutoff":"2025-01","context_window":1048576,"max_output_tokens":65536,"capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text","image","video","audio"],"output":["text","image","audio"]},"pricing":{"input":0.3,"output":2.5,"batch_input":0.15,"batch_output":1.25,"tiers":[{"label":"Text tokens","unit":"Per 1M tokens","columns":["Input","Cached input","Output"],"rows":[{"label":"Standard","values":[0.3,null,2.5]},{"label":"Priority","values":[0.54,null,4.5]},{"label":"Flex","values":[0.15,null,1.25]}]}]},"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"model_type":"chat","license":"proprietary","open_weight":false,"deprecation_date":"2026-03-31","successor":"gemini-3.1-flash-lite"},{"id":"gemini-2.5-flash-lite","name":"gemini-2.5-flash-lite","created_by":"google","source":"official","last_updated":"2026-06-29","family":"gemini-2.5","status":"active","knowledge_cutoff":"2025-01","context_window":1048576,"max_output_tokens":65536,"capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text","image","video","audio"],"output":["text","image","audio"]},"pricing":{"input":0.1,"output":0.4,"batch_input":0.05,"batch_output":0.2,"tiers":[{"label":"Text tokens","unit":"Per 1M tokens","columns":["Input","Cached 
input","Output"],"rows":[{"label":"Standard","values":[0.1,null,0.4]},{"label":"Priority","values":[0.18,null,0.72]},{"label":"Flex","values":[0.05,null,0.2]}]}]},"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"model_type":"chat","license":"proprietary","open_weight":false,"description":"The Interactions API is now generally available. We recommend using this API for access to all the latest features and models. Home Gemini API Docs Send feedback Gemini 2.5 Flash-Lite Our most cost-efficient multimodal model, offering the fastest performance for high-frequency, lightweight tasks. Gemini 2.5 Flash-Lite is best for high-volume classification, simple data extraction, and extremely low-latency applications where budget and speed are the primary constraints.","tagline":"Our most cost-efficient multimodal model, offering the fastest performance for high-frequency, lightweight tasks."},{"id":"gemini-2.5-flash-native-audio-preview-12-2025","name":"gemini-2.5-flash-native-audio-preview-12-2025","created_by":"google","source":"official","last_updated":"2026-06-29","family":"gemini-2.5","status":"active","knowledge_cutoff":"2025-01","context_window":131072,"max_output_tokens":8192,"capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text","image","video","audio"],"output":["text","image","audio"]},"pricing":{"input":0.3,"output":2.5,"batch_input":0.15,"batch_output":1.25,"tiers":[{"label":"Text tokens","unit":"Per 1M tokens","columns":["Input","Cached input","Output"],"rows":[{"label":"Standard","values":[0.3,null,2.5]},{"label":"Priority","values":[0.54,null,4.5]},{"label":"Flex","values":[0.15,null,1.25]}]}]},"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"model_type":"chat","license":"proprietary","open_weight":false,"description":"The Interactions API is now generally available. 
We recommend using this API for access to all the latest features and models. Home Gemini API Docs Send feedback Gemini 2.5 Flash Live Preview The Live API enables low-latency, real-time voice and video interactions with Gemini 2.5 Flash. It processes continuous streams of audio, video, or text to deliver immediate, human-like spoken responses, creating a natural conversational experience for your users.","tagline":"The Live API enables low-latency, real-time voice and video interactions with Gemini 2.5 Flash."},{"id":"gemini-2.5-flash-preview-05-20","name":"gemini-2.5-flash-preview-05-20","created_by":"google","source":"official","last_updated":"2026-05-23","family":"gemini-2.5","status":"deprecated","deprecation_date":"2025-11-18","successor":"gemini-3.5-flash","capabilities":{"streaming":true,"vision":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":0.3,"output":2.5,"batch_input":0.15,"batch_output":1.25,"tiers":[{"label":"Text tokens","unit":"Per 1M tokens","columns":["Input","Cached input","Output"],"rows":[{"label":"Standard","values":[0.3,null,2.5]},{"label":"Priority","values":[0.54,null,4.5]},{"label":"Flex","values":[0.15,null,1.25]}]}]},"model_type":"chat","license":"proprietary","open_weight":false},{"id":"gemini-2.5-flash-preview-09-2025","name":"gemini-2.5-flash-preview-09-2025","created_by":"google","source":"official","last_updated":"2026-03-24","family":"gemini-2.5","status":"active","knowledge_cutoff":"2025-01","context_window":1048576,"max_output_tokens":65536,"capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text","image","video","audio"],"output":["text","image","audio"]},"pricing":{"input":0.3,"output":2.5,"batch_input":0.15,"batch_output":1.25,"tiers":[{"label":"Text tokens","unit":"Per 1M tokens","columns":["Input","Cached 
input","Output"],"rows":[{"label":"Standard","values":[0.3,null,2.5]},{"label":"Priority","values":[0.54,null,4.5]},{"label":"Flex","values":[0.15,null,1.25]}]}]},"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"model_type":"chat","license":"proprietary","open_weight":false},{"id":"gemini-2.5-flash-preview-09-25","name":"gemini-2.5-flash-preview-09-25","created_by":"google","source":"official","last_updated":"2026-05-23","family":"gemini-2.5","status":"deprecated","deprecation_date":"2026-02-17","successor":"gemini-3.5-flash","capabilities":{"streaming":true,"vision":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":0.3,"output":2.5,"batch_input":0.15,"batch_output":1.25,"tiers":[{"label":"Text tokens","unit":"Per 1M tokens","columns":["Input","Cached input","Output"],"rows":[{"label":"Standard","values":[0.3,null,2.5]},{"label":"Priority","values":[0.54,null,4.5]},{"label":"Flex","values":[0.15,null,1.25]}]}]},"model_type":"chat","license":"proprietary","open_weight":false},{"id":"gemini-2.5-flash-preview-tts","name":"gemini-2.5-flash-preview-tts","created_by":"google","source":"official","last_updated":"2026-06-29","family":"gemini-2.5","status":"active","context_window":8192,"max_output_tokens":16384,"model_type":"tts","capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text","image","audio"],"output":["text","image","audio"]},"pricing":{"input":0.3,"output":2.5,"batch_input":0.15,"batch_output":1.25,"tiers":[{"label":"Text tokens","unit":"Per 1M tokens","columns":["Input","Cached input","Output"],"rows":[{"label":"Standard","values":[0.3,null,2.5]},{"label":"Priority","values":[0.54,null,4.5]},{"label":"Flex","values":[0.15,null,1.25]}]}]},"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"license":"proprietary","open_weight":false,"description":"The 
Interactions API is now generally available. We recommend using this API for access to all the latest features and models. Home Gemini API Docs Send feedback Gemini 2.5 Flash Text-to-Speech Our fastest engine for high-fidelity speech synthesis, offering low-latency and cost-efficient audio generation. Gemini 2.5 Flash TTS is best for real-time assistants, high-volume narration, and conversational use cases that require fine-grained control over voice style and pacing.","tagline":"Our fastest engine for high-fidelity speech synthesis, offering low-latency and cost-efficient audio generation."},{"id":"gemini-2.5-flash","name":"gemini-2.5-flash","created_by":"google","source":"official","last_updated":"2026-06-29","family":"gemini-2.5","status":"active","knowledge_cutoff":"2025-01","context_window":1048576,"max_output_tokens":65536,"capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text","image","video","audio"],"output":["text","image","audio"]},"pricing":{"input":0.3,"output":2.5,"batch_input":0.15,"batch_output":1.25,"tiers":[{"label":"Text tokens","unit":"Per 1M tokens","columns":["Input","Cached input","Output"],"rows":[{"label":"Standard","values":[0.3,null,2.5]},{"label":"Priority","values":[0.54,null,4.5]},{"label":"Flex","values":[0.15,null,1.25]}]}]},"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"model_type":"chat","license":"proprietary","open_weight":false,"description":"The Interactions API is now generally available. We recommend using this API for access to all the latest features and models. Home Gemini API Docs Send feedback Gemini 2.5 Flash Our best model in terms of price-performance, offering well-rounded capabilities. 
2.5 Flash is best for large scale processing, low-latency, high volume tasks that require thinking, and agentic use cases.","tagline":"Our best model in terms of price-performance, offering well-rounded capabilities."},{"id":"gemini-2.5-pro-preview-03-25","name":"gemini-2.5-pro-preview-03-25","created_by":"google","source":"official","last_updated":"2026-03-23","family":"gemini-2.5","status":"deprecated","deprecation_date":"2025-12-02","successor":"gemini-3.1-pro-preview","capabilities":{"streaming":true,"vision":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":1.25,"output":10,"batch_input":0.625,"batch_output":5,"tiers":[{"label":"Text tokens","unit":"Per 1M tokens","columns":["Input","Cached input","Output"],"rows":[{"label":"Standard","values":[1.25,null,10]},{"label":"Priority","values":[2.25,null,18]},{"label":"Flex","values":[0.625,null,5]}]}]},"model_type":"chat","license":"proprietary","open_weight":false},{"id":"gemini-2.5-pro-preview-05-06","name":"gemini-2.5-pro-preview-05-06","created_by":"google","source":"official","last_updated":"2026-03-23","family":"gemini-2.5","status":"deprecated","deprecation_date":"2025-12-02","successor":"gemini-3.1-pro-preview","capabilities":{"streaming":true,"vision":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":1.25,"output":10,"batch_input":0.625,"batch_output":5,"tiers":[{"label":"Text tokens","unit":"Per 1M tokens","columns":["Input","Cached 
input","Output"],"rows":[{"label":"Standard","values":[1.25,null,10]},{"label":"Priority","values":[2.25,null,18]},{"label":"Flex","values":[0.625,null,5]}]}]},"model_type":"chat","license":"proprietary","open_weight":false},{"id":"gemini-2.5-pro-preview-06-05","name":"gemini-2.5-pro-preview-06-05","created_by":"google","source":"official","last_updated":"2026-03-23","family":"gemini-2.5","status":"deprecated","deprecation_date":"2025-12-02","successor":"gemini-3.1-pro-preview","capabilities":{"streaming":true,"vision":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":1.25,"output":10,"batch_input":0.625,"batch_output":5,"tiers":[{"label":"Text tokens","unit":"Per 1M tokens","columns":["Input","Cached input","Output"],"rows":[{"label":"Standard","values":[1.25,null,10]},{"label":"Priority","values":[2.25,null,18]},{"label":"Flex","values":[0.625,null,5]}]}]},"model_type":"chat","license":"proprietary","open_weight":false},{"id":"gemini-2.5-pro-preview-tts","name":"gemini-2.5-pro-preview-tts","created_by":"google","source":"official","last_updated":"2026-06-29","family":"gemini-2.5","status":"active","context_window":8192,"max_output_tokens":16384,"model_type":"tts","capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text","image","audio"],"output":["text","image","audio"]},"pricing":{"input":1.25,"output":10,"batch_input":0.625,"batch_output":5,"tiers":[{"label":"Text tokens","unit":"Per 1M tokens","columns":["Input","Cached input","Output"],"rows":[{"label":"Standard","values":[1.25,null,10]},{"label":"Priority","values":[2.25,null,18]},{"label":"Flex","values":[0.625,null,5]}]}]},"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"license":"proprietary","open_weight":false,"description":"The Interactions API is now generally available. 
We recommend using this API for access to all the latest features and models. Home Gemini API Docs Send feedback Gemini 2.5 Pro Text-to-Speech Our premium engine for studio-quality speech synthesis, offering high-fidelity and sophisticated audio generation. Gemini 2.5 Pro TTS is best for long-form content, professional narrations, and complex creative workflows that require the highest level of vocal clarity and natural prosody.","tagline":"Our premium engine for studio-quality speech synthesis, offering high-fidelity and sophisticated audio generation."},{"id":"gemini-2.5-pro","name":"gemini-2.5-pro","created_by":"google","source":"official","last_updated":"2026-06-29","family":"gemini-2.5","status":"active","knowledge_cutoff":"2025-01","context_window":1048576,"max_output_tokens":65536,"capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text","image","video","audio"],"output":["text","image","audio"]},"pricing":{"input":1.25,"output":10,"batch_input":0.625,"batch_output":5,"tiers":[{"label":"Text tokens","unit":"Per 1M tokens","columns":["Input","Cached input","Output"],"rows":[{"label":"Standard","values":[1.25,null,10]},{"label":"Priority","values":[2.25,null,18]},{"label":"Flex","values":[0.625,null,5]}]}]},"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"model_type":"chat","license":"proprietary","open_weight":false,"description":"The Interactions API is now generally available. We recommend using this API for access to all the latest features and models. 
Home Gemini API Docs Send feedback Gemini 2.5 Pro Our state-of-the-art thinking model, capable of reasoning over complex problems in code, math, and STEM, as well as analyzing large datasets, codebases, and documents using long context.","tagline":"Our state-of-the-art thinking model, capable of reasoning over complex problems in code, math, and STEM, as well as analyzing large datasets, codebases, and documents using long context."},{"id":"gemini-3-flash-preview","name":"gemini-3-flash-preview","created_by":"google","source":"official","last_updated":"2026-06-29","family":"gemini-3","status":"active","knowledge_cutoff":"2025-01","context_window":1048576,"max_output_tokens":65536,"capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text","image","video","audio"],"output":["text","image","audio"]},"pricing":{"input":0.5,"output":3,"batch_input":0.25,"batch_output":1.5,"tiers":[{"label":"Text tokens","unit":"Per 1M tokens","columns":["Input","Cached input","Output"],"rows":[{"label":"Standard","values":[0.5,null,3]},{"label":"Priority","values":[0.9,null,5.4]},{"label":"Flex","values":[0.25,null,1.5]}]}]},"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"model_type":"chat","license":"proprietary","open_weight":false,"description":"The Interactions API is now generally available. We recommend using this API for access to all the latest features and models. 
Home Gemini API Docs Send feedback Gemini 3 Flash Preview The best model in the world for multimodal understanding, and our most powerful agentic and vibe-coding model yet, delivering richer visuals and deeper interactivity, all built on a foundation of state-of-the-art reasoning.","tagline":"The best model in the world for multimodal understanding, and our most powerful agentic and vibe-coding model yet, delivering richer visuals and deeper interactivity, all built on a foundation of stat"},{"id":"gemini-3-pro-image-preview","name":"gemini-3-pro-image-preview","created_by":"google","source":"official","last_updated":"2026-06-29","family":"gemini-3","status":"deprecated","knowledge_cutoff":"2025-01","context_window":65536,"max_output_tokens":32768,"capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":2,"output":12,"batch_input":1,"batch_output":6,"tiers":[{"label":"Text tokens","unit":"Per 1M tokens","columns":["Input","Cached 
input","Output"],"rows":[{"label":"Standard","values":[2,null,12]},{"label":"Priority","values":[null,null,null]},{"label":"Flex","values":[1,null,6]}]}]},"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"model_type":"chat","license":"proprietary","open_weight":false,"deprecation_date":"2026-06-25","successor":"gemini-3-pro-image"},{"id":"gemini-3-pro-image","name":"gemini-3-pro-image","created_by":"google","source":"official","family":"gemini-3","status":"active","knowledge_cutoff":"2025-01","context_window":65536,"max_output_tokens":32768,"model_type":"chat","license":"proprietary","open_weight":false,"capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text","image","audio"],"output":["text","image","audio"]},"pricing":{"input":2,"output":12,"batch_input":1,"batch_output":6,"tiers":[{"label":"Text tokens","unit":"Per 1M tokens","columns":["Input","Cached input","Output"],"rows":[{"label":"Standard","values":[2,null,12]},{"label":"Priority","values":[null,null,null]},{"label":"Flex","values":[1,null,6]}]}]},"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"last_updated":"2026-06-29","description":"The Interactions API is now generally available. We recommend using this API for access to all the latest features and models. Home Gemini API Docs Send feedback Gemini 3 Pro Image Nano Banana Pro is a sophisticated reasoning-driven engine for professional-grade image editing and generation, offering studio-quality precision and advanced creative control. 
Nano Banana Pro is best for complex graphic design, high-fidelity product mockups, and factual data visualizations that require accurate text rendering and real-world grounding via Google Search.","tagline":"The Interactions API is now generally available."},{"id":"gemini-3-pro-preview","name":"gemini-3-pro-preview","created_by":"google","source":"official","last_updated":"2026-03-24","family":"gemini-3","status":"deprecated","deprecation_date":"2026-03-09","knowledge_cutoff":"2025-01","context_window":1048576,"max_output_tokens":65536,"successor":"gemini-3.1-pro-preview","capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text","image","video","audio"],"output":["text","image","audio"]},"pricing":{"input":2,"output":12,"batch_input":1,"batch_output":6,"tiers":[{"label":"Text tokens","unit":"Per 1M tokens","columns":["Input","Cached input","Output"],"rows":[{"label":"Standard","values":[2,null,12]},{"label":"Priority","values":[3.6,null,21.6]},{"label":"Flex","values":[1,null,6]}]}]},"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"model_type":"chat","license":"proprietary","open_weight":false},{"id":"gemini-3.1-flash-image-preview","name":"gemini-3.1-flash-image-preview","created_by":"google","source":"official","last_updated":"2026-06-29","family":"gemini-3.1","status":"deprecated","knowledge_cutoff":"2025-01","context_window":131072,"max_output_tokens":32768,"capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text","image"],"output":["text"]},"pricing":{"input":0.5,"output":3,"batch_input":0.25,"batch_output":1.5,"tiers":[{"label":"Text tokens","unit":"Per 1M tokens","columns":["Input","Cached 
input","Output"],"rows":[{"label":"Standard","values":[0.5,null,3]},{"label":"Priority","values":[null,null,null]},{"label":"Flex","values":[0.25,null,1.5]}]}]},"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"model_type":"chat","license":"proprietary","open_weight":false,"deprecation_date":"2026-06-25","successor":"gemini-3.1-flash-image"},{"id":"gemini-3.1-flash-image","name":"gemini-3.1-flash-image","created_by":"google","source":"official","family":"gemini-3.1","status":"active","knowledge_cutoff":"2025-01","context_window":131072,"max_output_tokens":32768,"model_type":"chat","license":"proprietary","open_weight":false,"capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text","image","audio"],"output":["text","image","audio"]},"pricing":{"input":0.5,"output":3,"batch_input":0.25,"batch_output":1.5,"tiers":[{"label":"Text tokens","unit":"Per 1M tokens","columns":["Input","Cached input","Output"],"rows":[{"label":"Standard","values":[0.5,null,3]},{"label":"Priority","values":[null,null,null]},{"label":"Flex","values":[0.25,null,1.5]}]}]},"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"last_updated":"2026-06-29","description":"The Interactions API is now generally available. We recommend using this API for access to all the latest features and models. Home Gemini API Docs Send feedback Gemini 3.1 Flash Image Nano Banana 2 provides high-quality image generation and conversational editing at a mainstream price point and low latency. It serves as the high-efficiency counterpart to Gemini 3 Pro Image , optimized for speed and high-volume developer use cases. 
Key updates: New output resolution options: New support for 0.5K, 2K and 4K, default 1K New Image Search Grounding: Integration of both text and image search results to inform generation with real-time web data Supported with Thinking on or off New 1:4, 4:1, 1:8 and 8:1 aspect ratios Improved aspect ratio adherence Improved image quality and consistency Improved i18n text rendering","tagline":"The Interactions API is now generally available."},{"id":"gemini-3.1-flash-lite-preview","name":"gemini-3.1-flash-lite-preview","created_by":"google","source":"official","last_updated":"2026-05-29","family":"gemini-3.1","status":"deprecated","knowledge_cutoff":"2025-01","context_window":1048576,"max_output_tokens":65536,"capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text","image","video","audio"],"output":["text","image","audio"]},"pricing":{"input":0.25,"output":1.5,"batch_input":0.125,"batch_output":0.75,"tiers":[{"label":"Text tokens","unit":"Per 1M tokens","columns":["Input","Cached input","Output"],"rows":[{"label":"Standard","values":[0.25,null,1.5]},{"label":"Priority","values":[0.45,null,2.7]},{"label":"Flex","values":[0.125,null,0.75]}]}]},"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"model_type":"chat","license":"proprietary","open_weight":false,"description":"Our most cost-efficient multimodal model, offering the fastest performance for high-frequency, lightweight tasks. 
Gemini 3.1 Flash-Lite is best for high-volume agentic tasks, simple data extraction, and extremely low-latency applications where budget and speed are the primary constraints.","tagline":"Our most cost-efficient multimodal model, offering the fastest performance for high-frequency, lightweight tasks.","deprecation_date":"2026-05-25","successor":"gemini-3.1-flash-lite"},{"id":"gemini-3.1-flash-lite","name":"gemini-3.1-flash-lite","created_by":"google","source":"official","family":"gemini-3.1","description":"The Interactions API is now generally available. We recommend using this API for access to all the latest features and models. Home Gemini API Docs Send feedback Gemini 3.1 Flash-Lite Gemini 3.1 Flash-Lite is a low-latency, cost-effective multimodal model optimized for high-frequency, lightweight tasks. The model supports text, image, video, audio, and PDF inputs, and is designed for high-volume agentic workflows, simple data extraction, and applications where latency and API cost are the primary constraints.","status":"active","knowledge_cutoff":"2025-01","context_window":1048576,"max_output_tokens":65536,"model_type":"chat","license":"proprietary","tagline":"The model supports text, image, video, audio, and PDF inputs, and is designed for high-volume agentic workflows, simple data extraction, and applications where latency and API cost are the primary con","open_weight":false,"capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text","image","video","audio"],"output":["text","image","audio"]},"pricing":{"input":0.25,"output":1.5,"batch_input":0.125,"batch_output":0.75,"tiers":[{"label":"Text tokens","unit":"Per 1M tokens","columns":["Input","Cached 
input","Output"],"rows":[{"label":"Standard","values":[0.25,null,1.5]},{"label":"Priority","values":[0.45,null,2.7]},{"label":"Flex","values":[0.125,null,0.75]}]}]},"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"last_updated":"2026-06-29"},{"id":"gemini-3.1-flash-live-preview","name":"gemini-3.1-flash-live-preview","created_by":"google","source":"official","family":"gemini-3.1","status":"active","knowledge_cutoff":"2025-01","context_window":131072,"max_output_tokens":65536,"model_type":"chat","license":"proprietary","open_weight":false,"capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text","image","video","audio"],"output":["text","image","audio"]},"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"last_updated":"2026-06-29","description":"The Interactions API is now generally available. We recommend using this API for access to all the latest features and models. Home Gemini API Docs Send feedback Gemini 3.1 Flash Live Preview Gemini 3.1 Flash Live Preview is our low-latency, audio-to-audio model optimized for real-time dialogue and voice-first AI applications with acoustic nuance detection, numeric precision, and multimodal awareness.","tagline":"The Interactions API is now generally available."},{"id":"gemini-3.1-flash-tts-preview","name":"gemini-3.1-flash-tts-preview","created_by":"google","source":"official","family":"gemini-3.1","description":"The Interactions API is now generally available. We recommend using this API for access to all the latest features and models. 
Home Gemini API Docs Send feedback Gemini 3.1 Flash TTS (Text-to-Speech) Preview The Gemini 3.1 Flash TTS Preview model provides powerful, low-latency speech generation with natural outputs, steerable prompts, and new expressive audio tags for precise narration control.","status":"active","knowledge_cutoff":"2025-01","context_window":8192,"max_output_tokens":16384,"model_type":"tts","license":"proprietary","tagline":"The Gemini 3.1 Flash TTS Preview model provides powerful, low-latency speech generation with natural outputs, steerable prompts, and new expressive audio tags for precise narration control.","open_weight":false,"capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text","image","audio"],"output":["text","image","audio"]},"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"last_updated":"2026-06-29"},{"id":"gemini-3.1-pro-preview","name":"gemini-3.1-pro-preview","created_by":"google","source":"official","last_updated":"2026-06-29","family":"gemini-3.1","status":"active","knowledge_cutoff":"2025-01","context_window":1048576,"max_output_tokens":65536,"capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text","image","video","audio"],"output":["text","image","audio"]},"pricing":{"input":2,"output":12,"batch_input":1,"batch_output":6,"tiers":[{"label":"Text tokens","unit":"Per 1M tokens","columns":["Input","Cached input","Output"],"rows":[{"label":"Standard","values":[2,null,12]},{"label":"Priority","values":[3.6,null,21.6]},{"label":"Flex","values":[1,null,6]}]}]},"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"model_type":"chat","license":"proprietary","open_weight":false,"description":"The Interactions API is now generally available. 
We recommend using this API for access to all the latest features and models. Home Gemini API Docs Send feedback Gemini 3.1 Pro Preview Built to refine the performance and reliability of the Gemini 3 Pro series, Gemini 3.1 Pro Preview provides better thinking, improved token efficiency, and a more grounded, factually consistent experience. It's optimized for software engineering behavior and usability, as well as agentic workflows requiring precise tool usage and reliable multi-step execution across real-world domains.","tagline":"The Interactions API is now generally available."},{"id":"gemini-3.5-flash","name":"gemini-3.5-flash","created_by":"google","source":"official","family":"gemini-3.5","status":"active","knowledge_cutoff":"2025-01","context_window":1048576,"max_output_tokens":65536,"model_type":"chat","license":"proprietary","open_weight":false,"capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text","image","video","audio"],"output":["text","image","audio"]},"pricing":{"input":1.5,"output":9,"batch_input":0.75,"batch_output":4.5,"tiers":[{"label":"Text tokens","unit":"Per 1M tokens","columns":["Input","Cached input","Output"],"rows":[{"label":"Standard","values":[1.5,null,9]},{"label":"Priority","values":[2.7,null,16.2]},{"label":"Flex","values":[0.75,null,4.5]}]}]},"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"last_updated":"2026-06-29","description":"The Interactions API is now generally available. We recommend using this API for access to all the latest features and models. Home Gemini API Docs Send feedback Gemini 3.5 Flash Gemini 3.5 Flash provides sustained frontier-level intelligence optimized for real-world tasks at a higher speed and lower cost. Designed for the agentic era, it excels at sub-agent deployment, multi-step workflows, and long-horizon tasks at scale. 
This model is particularly effective for rapid agentic loops involving complex coding cycles and iterations.","tagline":"The Interactions API is now generally available."},{"id":"gemini-3.5-live-translate-preview","name":"gemini-3.5-live-translate-preview","created_by":"google","source":"official","family":"gemini-3.5","status":"active","knowledge_cutoff":"2025-01","context_window":131072,"max_output_tokens":65536,"model_type":"translation","license":"proprietary","open_weight":false,"capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text","image","audio"],"output":["text","image","audio"]},"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"last_updated":"2026-06-29","description":"The Interactions API is now generally available. We recommend using this API for access to all the latest features and models. Home Gemini API Docs Send feedback Gemini 3.5 Live Translate Gemini 3.5 Live Translate is our low-latency, audio-to-audio model optimized for real-time translation of spoken conversations. 
It enables seamless, bidirectional translation with high accuracy and natural voice output.","tagline":"The Interactions API is now generally available."},{"id":"gemini-embedding-001","name":"gemini-embedding-001","created_by":"google","source":"official","last_updated":"2026-03-27","status":"active","context_window":2048,"model_type":"embed","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["generateContent","streamGenerateContent"],"family":"gemini-embedding","license":"proprietary","open_weight":false},{"id":"gemini-embedding-2-preview","name":"gemini-embedding-2-preview","created_by":"google","source":"official","last_updated":"2026-03-23","status":"active","context_window":8192,"model_type":"embed","capabilities":{"vision":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["generateContent","streamGenerateContent"],"family":"gemini-embedding","license":"proprietary","open_weight":false},{"id":"gemini-embedding-2","name":"gemini-embedding-2","created_by":"google","source":"official","family":"gemini-embedding","status":"active","context_window":8192,"model_type":"embed","license":"proprietary","open_weight":false,"capabilities":{"vision":true},"modalities":{"input":["text"],"output":["text"]},"endpoints":["generateContent","streamGenerateContent"],"last_updated":"2026-04-24"},{"id":"gemini-embedding-exp-03-07","name":"gemini-embedding-exp-03-07","created_by":"google","source":"official","last_updated":"2026-06-02","status":"deprecated","deprecation_date":"2025-10-30","model_type":"embed","successor":"gemini-embedding-2","modalities":{"input":["text"],"output":["text"]},"family":"gemini-embedding","license":"proprietary","open_weight":false},{"id":"gemini-embedding-exp","name":"gemini-embedding-exp","created_by":"google","source":"official","last_updated":"2026-06-02","status":"deprecated","deprecation_date":"2025-10-30","model_type":"embed","successor":"gemini-embedding-2","modalities":{"input":["text
"],"output":["text"]},"family":"gemini-embedding","license":"proprietary","open_weight":false},{"id":"gemini-live-2.5-flash-preview","name":"gemini-live-2.5-flash-preview","created_by":"google","source":"official","last_updated":"2026-03-27","status":"deprecated","deprecation_date":"2025-12-09","successor":"gemini-3.1-flash-live-preview","capabilities":{"streaming":true,"vision":true},"modalities":{"input":["text","image"],"output":["text"]},"family":"gemini-2.5","model_type":"chat","license":"proprietary","open_weight":false},{"id":"gemini-robotics-er-1.5-preview","name":"gemini-robotics-er-1.5-preview","created_by":"google","source":"official","last_updated":"2026-06-29","status":"deprecated","knowledge_cutoff":"2025-01","context_window":1048576,"max_output_tokens":65536,"capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text","image","video","audio"],"output":["text","image","audio"]},"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"family":"gemini-1.5","model_type":"chat","license":"proprietary","open_weight":false,"deprecation_date":"2026-04-30","successor":"gemini-robotics-er-1.6-preview","description":"The Interactions API is now generally available. We recommend using this API for access to all the latest features and models. Home Gemini API Docs Send feedback Gemini Robotics-ER 1.5 Note: This version is planned for deprecation soon . See the models page for the latest model version. Gemini Robotics-ER 1.5 is a vision-language model (VLM) that brings Gemini's agentic capabilities to robotics. 
It's designed for advanced reasoning in the physical world, allowing robots to interpret complex visual data, perform spatial reasoning, and plan actions from natural language commands.","tagline":"The Interactions API is now generally available."},{"id":"gemini-robotics-er-1.6-preview","name":"gemini-robotics-er-1.6-preview","created_by":"google","source":"official","family":"gemini-1.6","status":"active","knowledge_cutoff":"2025-01","context_window":131072,"max_output_tokens":65536,"model_type":"chat","license":"proprietary","open_weight":false,"capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text","image","video","audio"],"output":["text","image","audio"]},"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"last_updated":"2026-06-29","description":"The Interactions API is now generally available. We recommend using this API for access to all the latest features and models. Home Gemini API Docs Send feedback Gemini Robotics-ER 1.6 Gemini Robotics-ER 1.6 is a vision-language model (VLM) that brings Gemini's agentic capabilities to robotics. 
It's designed for advanced reasoning in the physical world, allowing robots to interpret complex visual data, perform spatial reasoning, and plan actions from natural language commands.","tagline":"The Interactions API is now generally available."},{"id":"imagen-3.0-generate-002","name":"imagen-3.0-generate-002","created_by":"google","source":"official","last_updated":"2026-03-23","status":"deprecated","deprecation_date":"2025-11-10","model_type":"image","successor":"imagen-4.0-generate-001","modalities":{"input":["text"],"output":["image"]},"family":"imagen-3.0","license":"proprietary","open_weight":false},{"id":"imagen-4.0-fast-generate-001","name":"imagen-4.0-fast-generate-001","created_by":"google","source":"official","last_updated":"2026-03-27","status":"active","model_type":"image","modalities":{"input":["text"],"output":["image"]},"family":"imagen-4.0","license":"proprietary","open_weight":false},{"id":"imagen-4.0-generate-001","name":"imagen-4.0-generate-001","created_by":"google","source":"official","last_updated":"2026-03-27","status":"active","model_type":"image","modalities":{"input":["text"],"output":["image"]},"family":"imagen-4.0","license":"proprietary","open_weight":false},{"id":"imagen-4.0-generate-preview-06-06","name":"imagen-4.0-generate-preview-06-06","created_by":"google","source":"official","last_updated":"2026-03-23","status":"deprecated","deprecation_date":"2026-02-17","model_type":"image","successor":"imagen-4.0-generate-001","modalities":{"input":["text"],"output":["image"]},"family":"imagen-4.0","license":"proprietary","open_weight":false},{"id":"imagen-4.0-ultra-generate-001","name":"imagen-4.0-ultra-generate-001","created_by":"google","source":"official","last_updated":"2026-03-27","status":"active","model_type":"image","modalities":{"input":["text"],"output":["image"]},"family":"imagen-4.0","license":"proprietary","open_weight":false},{"id":"imagen-4.0-ultra-generate-preview-06-06","name":"imagen-4.0-ultra-generate-preview-06-06","cre
ated_by":"google","source":"official","last_updated":"2026-03-23","status":"deprecated","deprecation_date":"2026-02-17","model_type":"image","successor":"imagen-4.0-ultra-generate-001","modalities":{"input":["text"],"output":["image"]},"family":"imagen-4.0","license":"proprietary","open_weight":false},{"id":"imagen","name":"imagen","created_by":"google","source":"official","last_updated":"2026-06-29","status":"active","context_window":480,"model_type":"image","capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text"],"output":["image"]},"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"family":"imagen","license":"proprietary","open_weight":false,"description":"The Interactions API is now generally available. We recommend using this API for access to all the latest features and models. Home Gemini API Docs Send feedback Imagen 4 The Imagen 4 standard, ultra, and fast endpoints are deprecated and will be shut down on **August 17, 2026**; migrate to Gemini 3.1 Flash Image to avoid service interruptions. A high-performance engine for advanced visual synthesis, offering sophisticated creative control and photorealistic output. 
Use Imagen 4 for professional branding, intricate scene composition, and high-fidelity design tasks that require precise text rendering and complex lighting.","tagline":"A high-performance engine for advanced visual synthesis, offering sophisticated creative control and photorealistic output."},{"id":"jamba-1.5-large@vertex","name":"Jamba 1.5 Large","created_by":"ai21","source":"official","last_updated":"2026-03-22","capabilities":{"streaming":true},"modalities":{"input":["text"],"output":["text"]},"model_type":"chat"},{"id":"jamba-1.5-mini@vertex","name":"Jamba 1.5 Mini","created_by":"ai21","source":"official","last_updated":"2026-03-22","capabilities":{"streaming":true},"modalities":{"input":["text"],"output":["text"]},"model_type":"chat"},{"id":"lyria-3-clip-preview","name":"lyria-3-clip-preview","created_by":"google","source":"official","status":"active","context_window":131072,"model_type":"tts","license":"proprietary","open_weight":false,"capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text"],"output":["audio"]},"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"last_updated":"2026-06-29","description":"The Interactions API is now generally available. We recommend using this API for access to all the latest features and models. Home Gemini API Docs Send feedback Lyria 3 Clip Preview Lyria 3 Clip Preview is Google's model optimized for generating short musical clips, loops, and previews. 
It generates 30-second high-quality, 48kHz stereo audio from text prompts or image inputs.","tagline":"The Interactions API is now generally available."},{"id":"lyria-3-pro-preview","name":"lyria-3-pro-preview","created_by":"google","source":"official","status":"active","context_window":131072,"model_type":"tts","license":"proprietary","open_weight":false,"capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text"],"output":["audio"]},"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"last_updated":"2026-06-29","description":"The Interactions API is now generally available. We recommend using this API for access to all the latest features and models. Home Gemini API Docs Send feedback Lyria 3 Pro Preview Lyria 3 Pro Preview is Google's flagship music generation model. It is optimized for generating full-length songs with complex structural coherence, including multiple verses, choruses, and bridges. 
It generates high-quality, 48kHz stereo audio from text prompts or image inputs.","tagline":"The Interactions API is now generally available."},{"id":"lyria-realtime-exp","name":"lyria-realtime-exp","created_by":"google","source":"official","last_updated":"2026-03-24","status":"active","model_type":"tts","capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text"],"output":["audio"]},"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"license":"proprietary","open_weight":false},{"id":"mistral-medium-3@vertex","name":"Mistral Medium 3","created_by":"mistral","source":"official","last_updated":"2026-03-23","family":"mistral-medium","capabilities":{"streaming":true,"tool_call":true},"modalities":{"input":["text"],"output":["text"]},"pricing":{"input":0.4,"output":2,"tiers":[{"label":"Text tokens","unit":"Per 1M tokens","columns":["Input","Cached input","Output"],"rows":[{"label":"Standard","values":[0.4,null,2]}]}]},"model_type":"chat","tools":["function_calling"]},{"id":"text-embedding-004","name":"text-embedding-004","created_by":"google","source":"official","last_updated":"2026-06-02","status":"deprecated","deprecation_date":"2026-01-14","model_type":"embed","successor":"gemini-embedding-2","modalities":{"input":["text"],"output":["text"]},"family":"text-embedding","license":"proprietary","open_weight":false},{"id":"veo-2.0-generate-001","name":"veo-2.0-generate-001","created_by":"google","source":"official","last_updated":"2026-06-30","status":"deprecated","model_type":"video","capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text","image"],"output":["video"]},"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"family":"veo-2.0","license":"proprietary","open_weight":false,"description
":"The Interactions API is now generally available. We recommend using this API for access to all the latest features and models. Home Gemini API Docs Send feedback Veo 2.0 This model is deprecated and will be shut down on **June 30, 2026**; migrate to Veo 3.1 Preview or the GA models available through the Gemini Enterprise Agent Platform to avoid service interruptions. Our robust and reliable stable video generation model, providing consistent performance for production-ready workflows. Veo 2.0 is best for standard 1080p content creation, social media assets, and high-volume video tasks that prioritize reliable character consistency and predictable sub-second generation speeds.","tagline":"Our robust and reliable stable video generation model, providing consistent performance for production-ready workflows.","deprecation_date":"2026-06-30","successor":["veo-3.1-generate-preview","the GA models on the Gemini Enterprise Agent Platf","m"]},{"id":"veo-3.0-fast-generate-001","name":"veo-3.0-fast-generate-001","created_by":"google","source":"official","family":"veo-3.0","status":"deprecated","model_type":"video","license":"proprietary","open_weight":false,"modalities":{"input":["text"],"output":["video"]},"last_updated":"2026-06-30","deprecation_date":"2026-06-30","successor":["veo-3.1-fast-generate-preview","the GA models on the Gemini Enterprise Agent 
Platf","m"]},{"id":"veo-3.0-fast-generate-preview","name":"veo-3.0-fast-generate-preview","created_by":"google","source":"official","last_updated":"2026-03-23","status":"deprecated","deprecation_date":"2025-11-12","model_type":"video","successor":"veo-3.1-fast-generate-preview","modalities":{"input":["text"],"output":["video"]},"family":"veo-3.0","license":"proprietary","open_weight":false},{"id":"veo-3.0-generate-001","name":"veo-3.0-generate-001","created_by":"google","source":"official","family":"veo-3.0","status":"deprecated","model_type":"video","license":"proprietary","open_weight":false,"modalities":{"input":["text"],"output":["video"]},"last_updated":"2026-06-30","deprecation_date":"2026-06-30","successor":["veo-3.1-generate-preview","the GA models on the Gemini Enterprise Agent Platf","m"]},{"id":"veo-3.0-generate-preview","name":"veo-3.0-generate-preview","created_by":"google","source":"official","last_updated":"2026-03-23","status":"deprecated","deprecation_date":"2025-11-12","model_type":"video","successor":"veo-3.1-generate-preview","modalities":{"input":["text"],"output":["video"]},"family":"veo-3.0","license":"proprietary","open_weight":false},{"id":"veo-3.1-fast-generate-preview","name":"veo-3.1-fast-generate-preview","created_by":"google","source":"official","family":"veo-3.1","status":"deprecated","deprecation_date":"2025-10-15","model_type":"video","license":"proprietary","open_weight":false,"modalities":{"input":["text"],"output":["video"]},"last_updated":"2026-03-26"},{"id":"veo-3.1-generate-preview","name":"veo-3.1-generate-preview","created_by":"google","source":"official","last_updated":"2026-06-29","status":"active","context_window":1024,"model_type":"video","capabilities":{"streaming":true,"tool_call":true,"structured_output":true,"reasoning":true,"batch":true,"vision":true,"json_mode":true},"modalities":{"input":["text","image"],"output":["video"]},"tools":["function_calling"],"endpoints":["generateContent","streamGenerateContent"],"family
":"veo-3.1","license":"proprietary","open_weight":false,"description":"The Interactions API is now generally available. We recommend using this API for access to all the latest features and models. Home Gemini API Docs Send feedback Veo 3.1 A state-of-the-art cinematic engine designed for high-end creative storytelling and experimental video production. Veo 3.1 is best for professional-grade 4K output, natively synchronized audio generation, and complex camera movements that require the highest level of temporal consistency and artistic control.","tagline":"A state-of-the-art cinematic engine designed for high-end creative storytelling and experimental video production."},{"id":"veo-3.1-lite-generate-preview","name":"veo-3.1-lite-generate-preview","created_by":"google","source":"official","family":"veo-3.1","status":"active","context_window":1024,"model_type":"video","license":"proprietary","open_weight":false,"capabilities":{"streaming":true,"vision":true},"modalities":{"input":["text","image"],"output":["video"]},"endpoints":["generateContent","streamGenerateContent"],"last_updated":"2026-06-29","description":"The Interactions API is now generally available. We recommend using this API for access to all the latest features and models. Home Gemini API Docs Send feedback Veo 3.1 Lite Preview Veo 3.1 Lite Preview is a high-efficiency, developer-first video model providing high-fidelity video generation, editing, and cinematic control. It leverages the state-of-the-art Veo 3.1 model to democratize professional-grade video AI by offering a scalable, programmable interface for creators and enterprises.","tagline":"The Interactions API is now generally available."}]}; export const models: Model[] = provider.models.map((m) => ({ ...m, provider: provider.id }));