0:{"P":null,"b":"5AXMei98nKgQS6JfJw1RG","p":"","c":["","models"],"i":false,"f":[[["",{"children":["models",{"children":["__PAGE__",{}]}]},"$undefined","$undefined",true],["",["$","$1","c",{"children":[[["$","link","0",{"rel":"stylesheet","href":"/_next/static/css/c96a51c32ff5ed25.css?dpl=dpl_EtEgBEUPhZAsvP5JoxTr2vXLJxXw","precedence":"next","crossOrigin":"$undefined","nonce":"$undefined"}],["$","link","1",{"rel":"stylesheet","href":"/_next/static/css/0def0ef1eb28b07e.css?dpl=dpl_EtEgBEUPhZAsvP5JoxTr2vXLJxXw","precedence":"next","crossOrigin":"$undefined","nonce":"$undefined"}]],"$L2"]}],{"children":["models",["$","$1","c",{"children":[null,["$","$L3",null,{"parallelRouterKey":"children","error":"$undefined","errorStyles":"$undefined","errorScripts":"$undefined","template":["$","$L4",null,{}],"templateStyles":"$undefined","templateScripts":"$undefined","notFound":"$undefined","forbidden":"$undefined","unauthorized":"$undefined"}]]}],{"children":["__PAGE__",["$","$1","c",{"children":[["$","div",null,{"className":"bg-background text-foreground","children":[["$","script",null,{"type":"application/ld+json","dangerouslySetInnerHTML":{"__html":"$5"}}],["$","$L6",null,{}],["$","main",null,{"children":[["$","section",null,{"aria-labelledby":"models-directory-heading","className":"bg-primary/5 py-12 md:py-16 dark:bg-muted/30","children":["$","div",null,{"className":"mx-auto max-w-7xl px-4 sm:px-6 lg:px-8","children":[["$","h1",null,{"id":"models-directory-heading","className":"sr-only","children":"AI Models Directory"}],["$","$L7",null,{"models":[{"slug":"anthropic/claude-opus-5","name":"Claude Opus 5","shortName":"Claude Opus 5","author":"anthropic","authorDisplay":"Anthropic","description":"Claude Opus 5 is Anthropic’s flagship model for demanding reasoning, coding, and long-horizon agentic work. It is particularly strong at end-to-end software tasks, code review and bug finding, visual analysis...","shortDescription":"Claude Opus 5 is Anthropic’s flagship model for demanding reasoning, coding, and long-horizon agentic work.","categories":["text","multimodal","reasoning"],"inputModalities":["text","image","file"],"outputModalities":["text"],"contextLength":1000000,"supportsReasoning":true,"ranking":1,"createdAt":"2026-07-24T17:02:24.000Z","group":"anthropic/claude-opus-5-20260723","tier":"ultimate"},{"slug":"microsoft/mai-image-2.5-pro","name":"Microsoft: MAI-Image-2.5 Pro","shortName":"MAI-Image-2.5 Pro","author":"microsoft","authorDisplay":"Microsoft","description":"Microsoft's MAI-Image-2.5 is a high-quality image generation model available via Azure AI Foundry. It produces photorealistic and artistic images from text prompts with support for various aspect ratios.","shortDescription":"Microsoft's MAI-Image-2.","categories":["image","multimodal"],"inputModalities":["text","image"],"outputModalities":["image"],"contextLength":4096,"supportsReasoning":false,"ranking":2,"createdAt":"2026-07-23T17:28:21.000Z","group":"microsoft/mai-image-2.5-pro-20260723","tier":"pro"},{"slug":"inclusionai/ling-3.0-flash:free","name":"Ling-3.0-flash","shortName":"Ling-3.0-flash","author":"inclusionai","authorDisplay":"Inclusionai","description":"*Ling-3.0-flash* is a *124B-parameter Mixture-of-Experts (MoE) model*, with approximately *5.1B parameters activated per token*. The model is designed with *token efficiency and production-scale agentic inference* as key priorities, enabling developers...","shortDescription":"*Ling-3.","categories":["text","reasoning"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":262144,"supportsReasoning":true,"ranking":3,"createdAt":"2026-07-23T14:56:20.000Z","group":"inclusionai/ling-3.0-flash-20260723","tier":"basic"},{"slug":"poolside/laguna-s-2.1","name":"Poolside: Laguna S 2.1","shortName":"Laguna S 2.1","author":"poolside","authorDisplay":"Poolside","description":"Laguna S 2.1 is the latest coding agent model from [Poolside](). Laguna S 2.1 is a 118B total parameter model with 8B active parameters, scoring 70.2% on Terminal-Bench 2.1 and...","shortDescription":"Laguna S 2.","categories":["text","reasoning"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":1048576,"supportsReasoning":true,"ranking":4,"createdAt":"2026-07-21T16:51:23.000Z","group":"poolside/laguna-s-2.1-20260720","tier":"basic"},{"slug":"poolside/laguna-s-2.1:free","name":"Poolside: Laguna S 2.1","shortName":"Laguna S 2.1","author":"poolside","authorDisplay":"Poolside","description":"Laguna S 2.1 is the latest coding agent model from [Poolside](). Laguna S 2.1 is a 118B total parameter model with 8B active parameters, scoring 70.2% on Terminal-Bench 2.1 and...","shortDescription":"Laguna S 2.","categories":["text","reasoning"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":262144,"supportsReasoning":true,"ranking":5,"createdAt":"2026-07-21T16:51:23.000Z","group":"poolside/laguna-s-2.1-20260720","tier":"basic"},{"slug":"google/gemini-3.6-flash","name":"Google: Gemini 3.6 Flash","shortName":"Gemini 3.6 Flash","author":"google","authorDisplay":"Google","description":"Gemini 3.6 Flash is a high-efficiency model from Google for coding, agentic workflows, and web and app development. It is designed to produce polished outputs with fewer unnecessary edits and...","shortDescription":"Gemini 3.","categories":["text","multimodal","reasoning"],"inputModalities":["text","image","video","file","audio"],"outputModalities":["text"],"contextLength":1048576,"supportsReasoning":true,"ranking":6,"createdAt":"2026-07-21T15:12:13.000Z","group":"google/gemini-3.6-flash-20260721","tier":"pro"},{"slug":"google/gemini-3.5-flash-lite","name":"Google: Gemini 3.5 Flash Lite","shortName":"Gemini 3.5 Flash Lite","author":"google","authorDisplay":"Google","description":"Gemini 3.5 Flash Lite is a high-efficiency model from Google with upgraded agentic capabilities. It is suited for subagents that execute focused tasks within complex, multi-agent workflows.","shortDescription":"Gemini 3.","categories":["text","multimodal","reasoning"],"inputModalities":["text","image","video","file","audio"],"outputModalities":["text"],"contextLength":1048576,"supportsReasoning":true,"ranking":7,"createdAt":"2026-07-21T15:12:06.000Z","group":"google/gemini-3.5-flash-lite-20260721","tier":"basic"},{"slug":"krea/krea-2-large","name":"Krea: Krea 2 Large","shortName":"Krea 2 Large","author":"krea","authorDisplay":"Krea","description":"Krea 2 Large is Krea's high-capability image generation model, more than twice the size of Krea 2 Medium. Its lighter post-training gives images a rawer, more textured, and flexible character,...","shortDescription":"Krea 2 Large is Krea's high-capability image generation model, more than twice the size of Krea 2 Medium.","categories":["image","multimodal"],"inputModalities":["text","image"],"outputModalities":["image"],"contextLength":0,"supportsReasoning":false,"ranking":8,"createdAt":"2026-07-20T19:15:31.000Z","group":"krea/krea-2-large-20260720","tier":"pro"},{"slug":"krea/krea-2-medium","name":"Krea: Krea 2 Medium","shortName":"Krea 2 Medium","author":"krea","authorDisplay":"Krea","description":"Krea 2 Medium is Krea's balanced, cost-efficient image generation model and a practical starting point for a broad range of use cases. Its extensive post-training supports stable, consistent generations, with...","shortDescription":"Krea 2 Medium is Krea's balanced, cost-efficient image generation model and a practical starting point for a broad range of use cases.","categories":["image","multimodal"],"inputModalities":["text","image"],"outputModalities":["image"],"contextLength":0,"supportsReasoning":false,"ranking":9,"createdAt":"2026-07-20T19:15:28.000Z","group":"krea/krea-2-medium-20260720","tier":"pro"},{"slug":"krea/krea-2-medium-turbo","name":"Krea: Krea 2 Medium Turbo","shortName":"Krea 2 Medium Turbo","author":"krea","authorDisplay":"Krea","description":"Krea 2 Medium Turbo is a distilled, speed-focused variant of Krea 2 Medium from Krea. It is designed for rapid iteration and graphic design exploration where fast generation is the...","shortDescription":"Krea 2 Medium Turbo is a distilled, speed-focused variant of Krea 2 Medium from Krea.","categories":["image","multimodal"],"inputModalities":["text","image"],"outputModalities":["image"],"contextLength":0,"supportsReasoning":false,"ranking":10,"createdAt":"2026-07-20T19:15:23.000Z","group":"krea/krea-2-medium-turbo-20260720","tier":"pro"},{"slug":"meituan/longcat-2.0","name":"Meituan: LongCat 2.0","shortName":"LongCat 2.0","author":"meituan","authorDisplay":"Meituan","description":"LongCat 2.0 is a sparse mixture-of-experts language model from Meituan, with 48B active parameters out of 1.6T total. It is suited for coding, repository-level changes, long-horizon problem solving, and agentic...","shortDescription":"LongCat 2.","categories":["text","reasoning"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":1048756,"supportsReasoning":true,"ranking":11,"createdAt":"2026-07-20T13:37:38.000Z","group":"meituan/longcat-2.0-20260720","tier":"basic"},{"slug":"x-ai/grok-imagine-video-1.5","name":"xAI: Grok Imagine Video 1.5","shortName":"Grok Imagine Video 1.5","author":"x-ai","authorDisplay":"xAI","description":"Grok Imagine Video 1.5 is an image-to-video generation model from xAI. It animates a starting image with an optional text prompt that can direct subject and camera motion, pacing, atmosphere,...","shortDescription":"Grok Imagine Video 1.","categories":["video","multimodal"],"inputModalities":["text","image"],"outputModalities":["video"],"contextLength":0,"supportsReasoning":false,"ranking":12,"createdAt":"2026-07-20T11:48:20.000Z","group":"x-ai/grok-imagine-video-1.5-20260719","tier":"pro"},{"slug":"thinkingmachines/inkling","name":"Thinking Machines: Inkling","shortName":"Inkling","author":"thinkingmachines","authorDisplay":"Thinkingmachines","description":"Inkling is an open-weight multimodal mixture-of-experts model from Thinking Machines Lab, with 41B active parameters out of 975B total. It is designed for general-purpose reasoning, coding, agentic and tool-use systems,...","shortDescription":"Inkling is an open-weight multimodal mixture-of-experts model from Thinking Machines Lab, with 41B active parameters out of 975B total.","categories":["text","multimodal","reasoning"],"inputModalities":["text","image","audio"],"outputModalities":["text"],"contextLength":1048576,"supportsReasoning":true,"ranking":13,"createdAt":"2026-07-17T22:05:56.000Z","group":"thinkingmachines/inkling-20260715","tier":"pro"},{"slug":"openrouter/auto-beta","name":"Auto Router (Beta)","shortName":"Auto Router (Beta)","author":"openrouter","authorDisplay":"Openrouter","description":"Auto Router (Beta) is a task-aware router from OpenRouter. It classifies each request, then routes it the [most popular model](/rankings#task-spend) for that task based on aggregate spend, filtered by your...","shortDescription":"Auto Router (Beta) is a task-aware router from OpenRouter.","categories":["image","text","multimodal","reasoning"],"inputModalities":["text","image","audio","file","video"],"outputModalities":["text","image"],"contextLength":2000000,"supportsReasoning":true,"ranking":14,"createdAt":"2026-07-17T17:59:25.000Z","group":"openrouter/auto-beta","tier":"basic"},{"slug":"moonshotai/kimi-k3","name":"MoonshotAI: Kimi K3","shortName":"Kimi K3","author":"moonshotai","authorDisplay":"Moonshotai","description":"Kimi K3 is a 2.8T parameter open-weight multimodal reasoning model from Moonshot AI. It is suited for complex coding, knowledge work, and long-horizon agentic workflows, and is particularly strong at...","shortDescription":"Kimi K3 is a 2.","categories":["text","multimodal","reasoning"],"inputModalities":["text","image"],"outputModalities":["text"],"contextLength":1048576,"supportsReasoning":true,"ranking":15,"createdAt":"2026-07-16T15:30:58.000Z","group":"moonshotai/kimi-k3-20260715","tier":"pro"},{"slug":"meta/muse-spark-1.1","name":"Meta: Muse Spark 1.1","shortName":"Muse Spark 1.1","author":"meta","authorDisplay":"Meta","description":"Muse Spark 1.1 is a multimodal reasoning model from Meta, built for agentic tasks. It accepts text, images, video, audio, and PDF documents and returns text, with a 1M-token context...","shortDescription":"Muse Spark 1.","categories":["text","multimodal","reasoning"],"inputModalities":["text","image","video","file","audio"],"outputModalities":["text"],"contextLength":1048576,"supportsReasoning":true,"ranking":16,"createdAt":"2026-07-16T15:29:01.000Z","group":"meta/muse-spark-1.1-20260709","tier":"pro"},{"slug":"kwaipilot/kat-coder-air-v2.5","name":"Kwaipilot: KAT-Coder-Air V2.5","shortName":"KAT-Coder-Air V2.5","author":"kwaipilot","authorDisplay":"Kwaipilot","description":"KAT-Coder-Air V2.5 is a flagship-level Agentic Coding model that can directly hand over an entire issue or an entire business workflow to it, allowing it to autonomously locate and make...","shortDescription":"KAT-Coder-Air V2.","categories":["text","coding"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":256000,"supportsReasoning":false,"ranking":17,"createdAt":"2026-07-10T20:16:30.000Z","group":"kwaipilot/kat-coder-air-v2.5-20260710","tier":"basic"},{"slug":"kwaipilot/kat-coder-pro-v2.5","name":"Kwaipilot: KAT-Coder-Pro V2.5","shortName":"KAT-Coder-Pro V2.5","author":"kwaipilot","authorDisplay":"Kwaipilot","description":"KAT-Coder-Pro V2.5 is a flagship-level Agentic Coding model that can directly hand over an entire issue or an entire business workflow to it, allowing it to autonomously locate and make...","shortDescription":"KAT-Coder-Pro V2.","categories":["text","coding"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":256000,"supportsReasoning":false,"ranking":18,"createdAt":"2026-07-10T20:16:29.000Z","group":"kwaipilot/kat-coder-pro-v2.5-20260710","tier":"pro"},{"slug":"openai/gpt-5.6-luna-pro","name":"OpenAI: GPT-5.6 Luna Pro","shortName":"GPT-5.6 Luna Pro","author":"openai","authorDisplay":"OpenAI","description":"GPT-5.6 Luna Pro is the same underlying model as [GPT-5.6 Luna](https://openrouter.ai/openai/gpt-5.6-luna), served with `reasoning.mode` set to `pro` for higher-quality responses on complex tasks.\n\nLearn more in OpenAI's docs: https://developers.openai.com/api/docs/guides/reasoning#reasoning-mode","shortDescription":"GPT-5.","categories":["text","multimodal","reasoning"],"inputModalities":["file","image","text"],"outputModalities":["text"],"contextLength":1050000,"supportsReasoning":true,"ranking":19,"createdAt":"2026-07-09T09:54:27.000Z","group":"openai/gpt-5.6-luna-pro-20260709","tier":"pro"},{"slug":"openai/gpt-5.6-luna","name":"OpenAI: GPT-5.6 Luna","shortName":"GPT-5.6 Luna","author":"openai","authorDisplay":"OpenAI","description":"GPT-5.6 Luna is a fast, cost-efficient model in OpenAI's GPT-5.6 series. It is suited for high-volume, latency-sensitive tasks such as chat, classification, and lightweight agentic workflows, providing capable reasoning for...","shortDescription":"GPT-5.","categories":["text","multimodal","reasoning"],"inputModalities":["file","image","text"],"outputModalities":["text"],"contextLength":1050000,"supportsReasoning":true,"ranking":20,"createdAt":"2026-07-09T09:54:24.000Z","group":"openai/gpt-5.6-luna-20260709","tier":"pro"},{"slug":"openai/gpt-5.6-terra-pro","name":"OpenAI: GPT-5.6 Terra Pro","shortName":"GPT-5.6 Terra Pro","author":"openai","authorDisplay":"OpenAI","description":"GPT-5.6 Terra Pro is the same underlying model as [GPT-5.6 Terra](https://openrouter.ai/openai/gpt-5.6-terra), served with `reasoning.mode` set to `pro` for higher-quality responses on complex tasks.\n\nLearn more in OpenAI's docs: https://developers.openai.com/api/docs/guides/reasoning#reasoning-mode","shortDescription":"GPT-5.","categories":["text","multimodal","reasoning"],"inputModalities":["file","image","text"],"outputModalities":["text"],"contextLength":1050000,"supportsReasoning":true,"ranking":21,"createdAt":"2026-07-09T09:54:21.000Z","group":"openai/gpt-5.6-terra-pro-20260709","tier":"pro"},{"slug":"openai/gpt-5.6-terra","name":"OpenAI: GPT-5.6 Terra","shortName":"GPT-5.6 Terra","author":"openai","authorDisplay":"OpenAI","description":"GPT-5.6 Terra is a balanced model in OpenAI's GPT-5.6 series, positioned between the flagship Sol tier and the cost-efficient Luna tier. It is suited for everyday coding, reasoning, and agentic...","shortDescription":"GPT-5.","categories":["text","multimodal","reasoning"],"inputModalities":["file","image","text"],"outputModalities":["text"],"contextLength":1050000,"supportsReasoning":true,"ranking":22,"createdAt":"2026-07-09T09:54:17.000Z","group":"openai/gpt-5.6-terra-20260709","tier":"pro"},{"slug":"openai/gpt-5.6-sol-pro","name":"OpenAI: GPT-5.6 Sol Pro","shortName":"GPT-5.6 Sol Pro","author":"openai","authorDisplay":"OpenAI","description":"GPT-5.6 Sol Pro is the same underlying model as [GPT-5.6 Sol](https://openrouter.ai/openai/gpt-5.6-sol), served with `reasoning.mode` set to `pro` for higher-quality responses on complex tasks.\n\nLearn more in OpenAI's docs: https://developers.openai.com/api/docs/guides/reasoning#reasoning-mode","shortDescription":"GPT-5.","categories":["text","multimodal","reasoning"],"inputModalities":["file","image","text"],"outputModalities":["text"],"contextLength":1050000,"supportsReasoning":true,"ranking":23,"createdAt":"2026-07-09T09:54:14.000Z","group":"openai/gpt-5.6-sol-pro-20260709","tier":"ultimate"},{"slug":"openai/gpt-5.6-sol","name":"OpenAI: GPT-5.6 Sol","shortName":"GPT-5.6 Sol","author":"openai","authorDisplay":"OpenAI","description":"GPT-5.6 Sol is the flagship model in OpenAI's GPT-5.6 series. It is suited for complex reasoning, coding, and agentic workflows, and is particularly strong at command-line and multi-step coding tasks...","shortDescription":"GPT-5.","categories":["text","multimodal","reasoning"],"inputModalities":["file","image","text"],"outputModalities":["text"],"contextLength":1050000,"supportsReasoning":true,"ranking":24,"createdAt":"2026-07-09T09:54:10.000Z","group":"openai/gpt-5.6-sol-20260709","tier":"ultimate"},{"slug":"x-ai/grok-4.5","name":"xAI: Grok 4.5","shortName":"Grok 4.5","author":"x-ai","authorDisplay":"xAI","description":"Grok 4.5 is SpaceXAI's smartest model with frontier performance on coding, knowledge work, and STEM.","shortDescription":"Grok 4.","categories":["text","multimodal","reasoning"],"inputModalities":["text","image","file"],"outputModalities":["text"],"contextLength":500000,"supportsReasoning":true,"ranking":25,"createdAt":"2026-07-08T15:05:54.000Z","group":"x-ai/grok-4.5-20260708","tier":"pro"},{"slug":"~x-ai/grok-latest","name":"xAI: Grok Latest","shortName":"Grok Latest","author":"~x-ai","authorDisplay":"~x ai","description":"This model always redirects to the latest Grok model from xAI.","shortDescription":"This model always redirects to the latest Grok model from xAI.","categories":["text","multimodal","reasoning"],"inputModalities":["text","image","file"],"outputModalities":["text"],"contextLength":500000,"supportsReasoning":true,"ranking":26,"createdAt":"2026-07-08T14:02:40.000Z","group":"~x-ai/grok-latest","tier":"pro"},{"slug":"aion-labs/aion-3.0-mini","name":"AionLabs: Aion-3.0-Mini","shortName":"Aion-3.0-Mini","author":"aion-labs","authorDisplay":"Aion labs","description":"Aion-3.0 Mini is a multi-model roleplaying and storytelling system from AionLabs, built on the DeepSeek family of models. It uses a collaborative generation process in which multiple specialized models each...","shortDescription":"Aion-3.","categories":["text","reasoning"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":131072,"supportsReasoning":true,"ranking":27,"createdAt":"2026-07-07T16:51:36.000Z","group":"aion-labs/aion-3.0-mini-20260707","tier":"pro"},{"slug":"aion-labs/aion-3.0","name":"AionLabs: Aion-3.0","shortName":"Aion-3.0","author":"aion-labs","authorDisplay":"Aion labs","description":"Aion-3.0 is a multi-model roleplaying and storytelling system from AionLabs, built on the GLM family of models. It uses a collaborative generation process in which multiple specialized models each contribute...","shortDescription":"Aion-3.","categories":["text","reasoning"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":131072,"supportsReasoning":true,"ranking":28,"createdAt":"2026-07-07T16:51:35.000Z","group":"aion-labs/aion-3.0-20260707","tier":"pro"},{"slug":"tencent/hy3","name":"Tencent: Hy3","shortName":"Hy3","author":"tencent","authorDisplay":"Tencent","description":"Hy3 is a 295B-parameter Mixture-of-Experts model from Tencent (21B active, 192 experts with top-8 routing) built for reasoning, agentic workflows, and real-world production use. It supports a configurable reasoning effort:...","shortDescription":"Hy3 is a 295B-parameter Mixture-of-Experts model from Tencent (21B active, 192 experts with top-8 routing) built for reasoning, agentic workflows, and real-w...","categories":["text","reasoning"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":262144,"supportsReasoning":true,"ranking":29,"createdAt":"2026-07-06T13:20:48.000Z","group":"tencent/hy3-20260706","tier":"basic"},{"slug":"poolside/laguna-xs-2.1","name":"Poolside: Laguna XS 2.1","shortName":"Laguna XS 2.1","author":"poolside","authorDisplay":"Poolside","description":"Laguna XS 2.1 is the latest coding agent model in the 33B-A3B category from [Poolside](https://poolside.ai/) and a step forward from their Laguna XS.2 model (released in April 2026). It combines...","shortDescription":"Laguna XS 2.","categories":["text","reasoning"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":262144,"supportsReasoning":true,"ranking":30,"createdAt":"2026-07-02T14:27:09.000Z","group":"poolside/laguna-xs-2.1-20260625","tier":"basic"},{"slug":"poolside/laguna-xs-2.1:free","name":"Poolside: Laguna XS 2.1","shortName":"Laguna XS 2.1","author":"poolside","authorDisplay":"Poolside","description":"Laguna XS 2.1 is the latest coding agent model in the 33B-A3B category from [Poolside](https://poolside.ai/) and a step forward from their Laguna XS.2 model (released in April 2026). It combines...","shortDescription":"Laguna XS 2.","categories":["text","reasoning"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":262144,"supportsReasoning":true,"ranking":31,"createdAt":"2026-07-02T14:27:09.000Z","group":"poolside/laguna-xs-2.1-20260625","tier":"basic"},{"slug":"anthropic/claude-sonnet-5","name":"Anthropic: Claude Sonnet 5","shortName":"Claude Sonnet 5","author":"anthropic","authorDisplay":"Anthropic","description":"Sonnet 5 is Anthropic's most capable Sonnet-class model, with frontier performance across coding, agents, and professional work. It supports adaptive thinking with selectable reasoning effort levels (low, medium, high, max,...","shortDescription":"Sonnet 5 is Anthropic's most capable Sonnet-class model, with frontier performance across coding, agents, and professional work.","categories":["text","multimodal","reasoning"],"inputModalities":["text","image","file"],"outputModalities":["text"],"contextLength":1000000,"supportsReasoning":true,"ranking":32,"createdAt":"2026-06-30T18:11:23.000Z","group":"anthropic/claude-sonnet-5-20260630","tier":"pro"},{"slug":"google/gemini-3.1-flash-lite-image","name":"Google: Nano Banana 2 Lite (Gemini 3.1 Flash Lite Image)","shortName":"Nano Banana 2 Lite (Gemini 3.1 Flash Lite Image)","author":"google","authorDisplay":"Google","description":"Nano Banana 2 Lite (Gemini 3.1 Flash Lite Image) is Google's fastest, most cost-efficient Gemini image model, built for high-velocity developer pipelines and rapid-fire visual exploration. It delivers text-to-image generation...","shortDescription":"Nano Banana 2 Lite (Gemini 3.","categories":["image","text","multimodal","reasoning"],"inputModalities":["image","text"],"outputModalities":["image","text"],"contextLength":65536,"supportsReasoning":true,"ranking":33,"createdAt":"2026-06-30T16:33:45.000Z","group":"google/gemini-3.1-flash-lite-image-20260630","tier":"basic"},{"slug":"nex-agi/nex-n2-mini","name":"Nex AGI: Nex-N2-Mini","shortName":"Nex-N2-Mini","author":"nex-agi","authorDisplay":"Nex agi","description":"Nex-N2-Mini is an open-source agentic mixture-of-experts model from Nex AGI, the smaller sibling in the Nex-N2 series. It accepts text and image input and is built for coding, tool use,...","shortDescription":"Nex-N2-Mini is an open-source agentic mixture-of-experts model from Nex AGI, the smaller sibling in the Nex-N2 series.","categories":["text","multimodal","reasoning"],"inputModalities":["text","image"],"outputModalities":["text"],"contextLength":262144,"supportsReasoning":true,"ranking":34,"createdAt":"2026-06-24T14:56:04.000Z","group":"nex-agi/nex-n2-mini","tier":"basic"},{"slug":"sakana/fugu-ultra","name":"Sakana: Fugu Ultra","shortName":"Fugu Ultra","author":"sakana","authorDisplay":"Sakana","description":"Fugu Ultra is the higher-performance model in Sakana AI's Fugu family. Rather than a single monolithic model, Fugu is a learned multi-agent orchestration system: a language model trained to route...","shortDescription":"Fugu Ultra is the higher-performance model in Sakana AI's Fugu family.","categories":["text","multimodal","reasoning"],"inputModalities":["text","image"],"outputModalities":["text"],"contextLength":1000000,"supportsReasoning":true,"ranking":35,"createdAt":"2026-06-24T04:45:03.000Z","group":"sakana/fugu-ultra-20260615","tier":"ultimate"},{"slug":"alibaba/happyhorse-1.1","name":"Alibaba: HappyHorse 1.1","shortName":"HappyHorse 1.1","author":"alibaba","authorDisplay":"Alibaba","description":"HappyHorse 1.1 is a video generation model from Alibaba. It generates short videos from a text prompt, a single starting image, or a set of reference images, with output up...","shortDescription":"HappyHorse 1.","categories":["video","multimodal"],"inputModalities":["text","image"],"outputModalities":["video"],"contextLength":0,"supportsReasoning":false,"ranking":36,"createdAt":"2026-06-24T02:54:03.000Z","group":"alibaba/happyhorse-1.1-20260624","tier":"pro"},{"slug":"openai/gpt-image-1-mini","name":"OpenAI: GPT Image 1 Mini","shortName":"GPT Image 1 Mini","author":"openai","authorDisplay":"OpenAI","description":"A cost-efficient variant of GPT Image 1 for high-quality image generation at reduced latency and cost via OpenAI's dedicated Images API.","shortDescription":"A cost-efficient variant of GPT Image 1 for high-quality image generation at reduced latency and cost via OpenAI's dedicated Images API.","categories":["image","multimodal"],"inputModalities":["text","image"],"outputModalities":["image"],"contextLength":400000,"supportsReasoning":false,"ranking":37,"createdAt":"2026-06-24T01:31:53.000Z","group":"openai/gpt-image-1-mini","tier":"pro"},{"slug":"alibaba/happyhorse-1.0","name":"Alibaba: HappyHorse 1.0","shortName":"HappyHorse 1.0","author":"alibaba","authorDisplay":"Alibaba","description":"HappyHorse 1.0 is a video generation model from Alibaba. It generates short videos from a text prompt, a single starting image, or a set of reference images, with output up...","shortDescription":"HappyHorse 1.","categories":["video","multimodal"],"inputModalities":["text","image"],"outputModalities":["video"],"contextLength":0,"supportsReasoning":false,"ranking":38,"createdAt":"2026-06-24T00:18:44.000Z","group":"alibaba/happyhorse-1.0-20260624","tier":"pro"},{"slug":"google/gemini-3.1-flash-image","name":"Google: Nano Banana 2 (Gemini 3.1 Flash Image)","shortName":"Nano Banana 2 (Gemini 3.1 Flash Image)","author":"google","authorDisplay":"Google","description":"Gemini 3.1 Flash Image, a.k.a. \"Nano Banana 2,\" is Google’s latest state of the art image generation and editing model, delivering Pro-level visual quality at Flash speed. It combines advanced...","shortDescription":"Gemini 3.","categories":["image","text","multimodal","reasoning"],"inputModalities":["image","text"],"outputModalities":["image","text"],"contextLength":131072,"supportsReasoning":true,"ranking":39,"createdAt":"2026-06-18T03:41:05.000Z","group":"google/gemini-3.1-flash-image-20260528","tier":"pro"},{"slug":"google/gemini-3-pro-image","name":"Google: Nano Banana Pro (Gemini 3 Pro Image)","shortName":"Nano Banana Pro (Gemini 3 Pro Image)","author":"google","authorDisplay":"Google","description":"Nano Banana Pro is Google’s most advanced image-generation and editing model, built on Gemini 3 Pro. It extends the original Nano Banana with significantly improved multimodal reasoning, real-world grounding, and...","shortDescription":"Nano Banana Pro is Google’s most advanced image-generation and editing model, built on Gemini 3 Pro.","categories":["image","text","multimodal","reasoning"],"inputModalities":["image","text"],"outputModalities":["image","text"],"contextLength":131072,"supportsReasoning":true,"ranking":40,"createdAt":"2026-06-18T03:40:54.000Z","group":"google/gemini-3-pro-image-20260528","tier":"pro"},{"slug":"cohere/north-mini-code:free","name":"Cohere: North Mini Code","shortName":"North Mini Code","author":"cohere","authorDisplay":"Cohere","description":"North Mini Code is Cohere's first agentic coding model and the debut of its North family. A sparse mixture-of-experts model with 30B total parameters and 3B active, it is optimized...","shortDescription":"North Mini Code is Cohere's first agentic coding model and the debut of its North family.","categories":["text","reasoning","coding"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":256000,"supportsReasoning":true,"ranking":41,"createdAt":"2026-06-17T19:15:48.000Z","group":"cohere/north-mini-code-20260617","tier":"basic"},{"slug":"z-ai/glm-5.2","name":"Z.ai: GLM 5.2","shortName":"GLM 5.2","author":"z-ai","authorDisplay":"Z ai","description":"GLM 5.2 is a large-scale reasoning model from Z.ai. It supports text input and output with a 1M-token context window, and is suited for long-horizon agent workflows, project-level software engineering,...","shortDescription":"GLM 5.","categories":["text","reasoning"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":1048576,"supportsReasoning":true,"ranking":42,"createdAt":"2026-06-16T17:45:30.000Z","group":"z-ai/glm-5.2-20260616","tier":"pro"},{"slug":"openrouter/fusion","name":"OpenRouter: Fusion","shortName":"Fusion","author":"openrouter","authorDisplay":"Openrouter","description":"Fusion turns your prompt into a small multi-model deliberation. A panel of expert models (see below) analyzes your prompt in parallel with web search and web fetch enabled, then a...","shortDescription":"Fusion turns your prompt into a small multi-model deliberation.","categories":["text"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":1000000,"supportsReasoning":false,"ranking":43,"createdAt":"2026-06-13T17:27:27.000Z","group":"openrouter/fusion","tier":"basic"},{"slug":"moonshotai/kimi-k2.7-code","name":"MoonshotAI: Kimi K2.7 Code","shortName":"Kimi K2.7 Code","author":"moonshotai","authorDisplay":"Moonshotai","description":"MoonshotAI: Kimi K2.7 Code is a coding-focused model in Moonshot AI's Kimi K2 family, built to complete end-to-end programming tasks reliably over long contexts. It uses a native multimodal mixture-of-experts...","shortDescription":"MoonshotAI: Kimi K2.","categories":["text","multimodal","reasoning","coding"],"inputModalities":["text","image"],"outputModalities":["text"],"contextLength":262144,"supportsReasoning":true,"ranking":44,"createdAt":"2026-06-12T12:12:41.000Z","group":"moonshotai/kimi-k2.7-code-20260612","tier":"pro"},{"slug":"nex-agi/nex-n2-pro","name":"Nex AGI: Nex-N2-Pro","shortName":"Nex-N2-Pro","author":"nex-agi","authorDisplay":"Nex agi","description":"Nex-N2-Pro is an agentic mixture-of-experts model from Nex AGI, with 17B active parameters out of 397B total. Built on the Qwen3.5 architecture, it accepts text and image input and produces...","shortDescription":"Nex-N2-Pro is an agentic mixture-of-experts model from Nex AGI, with 17B active parameters out of 397B total.","categories":["text","multimodal","reasoning"],"inputModalities":["text","image"],"outputModalities":["text"],"contextLength":262144,"supportsReasoning":true,"ranking":45,"createdAt":"2026-06-08T16:45:40.000Z","group":"nex-agi/nex-n2-pro","tier":"basic"},{"slug":"sourceful/riverflow-v2.5-pro","name":"Sourceful: Riverflow V2.5 Pro","shortName":"Riverflow V2.5 Pro","author":"sourceful","authorDisplay":"Sourceful","description":"Riverflow V2.5 Pro is the most powerful variant of Sourceful's Riverflow 2.5 lineup, best for top-tier control and quality-sensitive outputs. The Riverflow 2.5 series is a unified text-to-image and image-to-image...","shortDescription":"Riverflow V2.","categories":["image","multimodal","reasoning"],"inputModalities":["text","image"],"outputModalities":["image"],"contextLength":32768,"supportsReasoning":true,"ranking":46,"createdAt":"2026-06-04T14:56:31.000Z","group":"sourceful/riverflow-v2.5-pro-20260605","tier":"pro"},{"slug":"sourceful/riverflow-v2.5-fast","name":"Sourceful: Riverflow V2.5 Fast","shortName":"Riverflow V2.5 Fast","author":"sourceful","authorDisplay":"Sourceful","description":"Riverflow V2.5 Fast is the speed-optimized variant of Sourceful's Riverflow 2.5 lineup, best for production deployments and latency-critical workflows. The Riverflow 2.5 series is a unified text-to-image and image-to-image family...","shortDescription":"Riverflow V2.","categories":["image","multimodal","reasoning"],"inputModalities":["text","image"],"outputModalities":["image"],"contextLength":32768,"supportsReasoning":true,"ranking":47,"createdAt":"2026-06-04T14:56:23.000Z","group":"sourceful/riverflow-v2.5-fast-20260605","tier":"pro"},{"slug":"nvidia/nemotron-3.5-content-safety:free","name":"NVIDIA: Nemotron 3.5 Content Safety","shortName":"Nemotron 3.5 Content Safety","author":"nvidia","authorDisplay":"NVIDIA","description":"NVIDIA Nemotron 3.5 Content Safety is a compact 4B-parameter multimodal guardrail model from NVIDIA, fine-tuned from Google Gemma-3-4B. It moderates both inputs to and responses from LLMs and VLMs, accepting...","shortDescription":"NVIDIA Nemotron 3.","categories":["text","multimodal","reasoning"],"inputModalities":["text","image"],"outputModalities":["text"],"contextLength":128000,"supportsReasoning":true,"ranking":48,"createdAt":"2026-06-04T14:04:24.000Z","group":"nvidia/nemotron-3.5-content-safety-20260604","tier":"basic"},{"slug":"nvidia/nemotron-3-ultra-550b-a55b","name":"NVIDIA: Nemotron 3 Ultra","shortName":"Nemotron 3 Ultra","author":"nvidia","authorDisplay":"NVIDIA","description":"NVIDIA Nemotron 3 Ultra is an open frontier-reasoning and orchestration model from NVIDIA, with 55B active parameters out of 550B total (MoE). Built on a hybrid Transformer-Mamba mixture-of-experts architecture, it...","shortDescription":"NVIDIA Nemotron 3 Ultra is an open frontier-reasoning and orchestration model from NVIDIA, with 55B active parameters out of 550B total (MoE).","categories":["text","reasoning"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":512288,"supportsReasoning":true,"ranking":49,"createdAt":"2026-06-04T05:33:28.000Z","group":"nvidia/nemotron-3-ultra-550b-a55b-20260604","tier":"pro"},{"slug":"nvidia/nemotron-3-ultra-550b-a55b:free","name":"NVIDIA: Nemotron 3 Ultra","shortName":"Nemotron 3 Ultra","author":"nvidia","authorDisplay":"NVIDIA","description":"NVIDIA Nemotron 3 Ultra is an open frontier-reasoning and orchestration model from NVIDIA, with 55B active parameters out of 550B total (MoE). Built on a hybrid Transformer-Mamba mixture-of-experts architecture, it...","shortDescription":"NVIDIA Nemotron 3 Ultra is an open frontier-reasoning and orchestration model from NVIDIA, with 55B active parameters out of 550B total (MoE).","categories":["text","reasoning"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":1000000,"supportsReasoning":true,"ranking":50,"createdAt":"2026-06-04T05:33:28.000Z","group":"nvidia/nemotron-3-ultra-550b-a55b-20260604","tier":"basic"},{"slug":"qwen/qwen3.7-plus","name":"Qwen: Qwen3.7 Plus","shortName":"Qwen3.7 Plus","author":"qwen","authorDisplay":"Qwen","description":"Qwen3.7-Plus is a cost-effective model in Alibaba's Qwen3.7 series. It supports text and image input with text output, building on the series' text capabilities with a comprehensive upgrade to its...","shortDescription":"Qwen3.","categories":["text","multimodal","reasoning"],"inputModalities":["text","image"],"outputModalities":["text"],"contextLength":1000000,"supportsReasoning":true,"ranking":51,"createdAt":"2026-06-03T13:03:03.000Z","group":"qwen/qwen3.7-plus-20260602","tier":"pro"},{"slug":"microsoft/mai-image-2.5","name":"Microsoft: MAI-Image-2.5","shortName":"MAI-Image-2.5","author":"microsoft","authorDisplay":"Microsoft","description":"Microsoft's MAI-Image-2.5 is a high-quality image generation model available via Azure AI Foundry. It produces photorealistic and artistic images from text prompts with support for various aspect ratios.","shortDescription":"Microsoft's MAI-Image-2.","categories":["image","multimodal"],"inputModalities":["text","image"],"outputModalities":["image"],"contextLength":4096,"supportsReasoning":false,"ranking":52,"createdAt":"2026-06-02T18:28:16.000Z","group":"microsoft/mai-image-2.5","tier":"pro"},{"slug":"minimax/minimax-m3","name":"MiniMax: MiniMax M3","shortName":"MiniMax M3","author":"minimax","authorDisplay":"Minimax","description":"MiniMax-M3 is a multimodal foundation model from MiniMax. It supports text, image, and video inputs with text output, a 1M-token context window, and is suited for long-horizon agentic work, coding,...","shortDescription":"MiniMax-M3 is a multimodal foundation model from MiniMax.","categories":["text","multimodal","reasoning"],"inputModalities":["text","image","video"],"outputModalities":["text"],"contextLength":1048576,"supportsReasoning":true,"ranking":53,"createdAt":"2026-05-31T16:36:14.000Z","group":"minimax/minimax-m3-20260531","tier":"basic"},{"slug":"stepfun/step-3.7-flash","name":"StepFun: Step 3.7 Flash","shortName":"Step 3.7 Flash","author":"stepfun","authorDisplay":"Stepfun","description":"Step 3.7 Flash is StepFun's latest high-efficiency multimodal Mixture-of-Experts model. It pairs a 196B-parameter language backbone with a vision encoder for native image and video understanding, activating roughly 11B parameters...","shortDescription":"Step 3.","categories":["text","multimodal","reasoning"],"inputModalities":["text","image","video"],"outputModalities":["text"],"contextLength":262144,"supportsReasoning":true,"ranking":54,"createdAt":"2026-05-28T16:17:49.000Z","group":"stepfun/step-3.7-flash-20260528","tier":"basic"},{"slug":"anthropic/claude-opus-4.8","name":"Anthropic: Claude Opus 4.8","shortName":"Claude Opus 4.8","author":"anthropic","authorDisplay":"Anthropic","description":"Claude Opus 4.8 is Anthropic's most capable generally available model in the Opus family. It supports text, image, and file inputs with text output, with reasoning support and a 1M-token...","shortDescription":"Claude Opus 4.","categories":["text","multimodal","reasoning"],"inputModalities":["text","image","file"],"outputModalities":["text"],"contextLength":1000000,"supportsReasoning":true,"ranking":55,"createdAt":"2026-05-27T18:04:51.000Z","group":"anthropic/claude-4.8-opus-20260528","tier":"ultimate"},{"slug":"qwen/qwen3.7-max","name":"Qwen: Qwen3.7 Max","shortName":"Qwen3.7 Max","author":"qwen","authorDisplay":"Qwen","description":"Qwen3.7-Max is the flagship model in Alibaba's Qwen3.7 series. It supports text input and output and is designed for agent-centric workloads, with particular strengths in coding, office and productivity tasks,...","shortDescription":"Qwen3.","categories":["text","reasoning"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":1000000,"supportsReasoning":true,"ranking":56,"createdAt":"2026-05-21T15:21:01.000Z","group":"qwen/qwen3.7-max-20260520","tier":"pro"},{"slug":"x-ai/grok-build-0.1","name":"xAI: Grok Build 0.1","shortName":"Grok Build 0.1","author":"x-ai","authorDisplay":"xAI","description":"Grok Build 0.1 is xAI’s fast coding model trained specifically for agentic software engineering workflows. It supports text and image inputs with text output, and is optimized for interactive coding...","shortDescription":"Grok Build 0.","categories":["text","multimodal","reasoning"],"inputModalities":["text","image","file"],"outputModalities":["text"],"contextLength":256000,"supportsReasoning":true,"ranking":57,"createdAt":"2026-05-20T17:28:43.000Z","group":"x-ai/grok-build-0.1-20260520","tier":"pro"},{"slug":"google/gemini-3.5-flash","name":"Google: Gemini 3.5 Flash","shortName":"Gemini 3.5 Flash","author":"google","authorDisplay":"Google","description":"Gemini 3.5 Flash is Google's high-efficiency multimodal model, bringing near-Pro level coding and reasoning at Flash-tier cost and speed. It is highly optimized for coding proficiency and parallel agentic execution...","shortDescription":"Gemini 3.","categories":["text","multimodal","reasoning"],"inputModalities":["text","image","video","file","audio"],"outputModalities":["text"],"contextLength":1048576,"supportsReasoning":true,"ranking":58,"createdAt":"2026-05-19T12:30:00.000Z","group":"google/gemini-3.5-flash-20260519","tier":"pro"},{"slug":"x-ai/grok-imagine-video","name":"xAI: Grok Imagine Video","shortName":"Grok Imagine Video","author":"x-ai","authorDisplay":"xAI","description":"Grok Imagine Video is xAI's fast, text-, image-, and reference-conditioned video generation model. It produces short videos (1–15 seconds, 24 fps) at 480p or 720p across seven aspect ratios -...","shortDescription":"Grok Imagine Video is xAI's fast, text-, image-, and reference-conditioned video generation model.","categories":["video","multimodal"],"inputModalities":["text","image"],"outputModalities":["video"],"contextLength":0,"supportsReasoning":false,"ranking":59,"createdAt":"2026-05-18T15:19:46.000Z","group":"x-ai/grok-imagine-video-20260512","tier":"pro"},{"slug":"x-ai/grok-imagine-image-quality","name":"xAI: Grok Imagine Image Quality","shortName":"Grok Imagine Image Quality","author":"x-ai","authorDisplay":"xAI","description":"Grok Imagine Image Quality is xAI's fast, high-fidelity image generation and editing model. It accepts text prompts and optional reference images, producing photorealistic outputs at 1K or 2K across a...","shortDescription":"Grok Imagine Image Quality is xAI's fast, high-fidelity image generation and editing model.","categories":["image","multimodal"],"inputModalities":["text","image"],"outputModalities":["image"],"contextLength":65536,"supportsReasoning":false,"ranking":60,"createdAt":"2026-05-18T15:19:44.000Z","group":"x-ai/grok-imagine-image-quality-20260512","tier":"pro"},{"slug":"recraft/recraft-v4.1-pro-vector","name":"Recraft: Recraft V4.1 Pro Vector","shortName":"Recraft V4.1 Pro Vector","author":"recraft","authorDisplay":"Recraft","description":"Recraft V4.1 Pro Vector is the vector (SVG) variant of Recraft V4.1 Pro, tuned for high aesthetics. It supports text and image inputs and produces higher-resolution SVG image output across...","shortDescription":"Recraft V4.","categories":["image","multimodal"],"inputModalities":["text","image"],"outputModalities":["image"],"contextLength":65536,"supportsReasoning":false,"ranking":61,"createdAt":"2026-05-13T21:23:15.000Z","group":"recraft/recraft-v4.1-pro-vector-20260514","tier":"pro"},{"slug":"recraft/recraft-v4.1-vector","name":"Recraft: Recraft V4.1 Vector","shortName":"Recraft V4.1 Vector","author":"recraft","authorDisplay":"Recraft","description":"Recraft V4.1 Vector is the vector (SVG) variant of Recraft V4.1, tuned for high aesthetics. It supports text and image inputs and produces SVG image output across multiple aspect ratios,...","shortDescription":"Recraft V4.","categories":["image","multimodal"],"inputModalities":["text","image"],"outputModalities":["image"],"contextLength":65536,"supportsReasoning":false,"ranking":62,"createdAt":"2026-05-13T21:23:12.000Z","group":"recraft/recraft-v4.1-vector-20260514","tier":"pro"},{"slug":"recraft/recraft-v4.1-utility-pro","name":"Recraft: Recraft V4.1 Utility Pro","shortName":"Recraft V4.1 Utility Pro","author":"recraft","authorDisplay":"Recraft","description":"Recraft V4.1 Utility Pro is a general-purpose image generation model from Recraft. It supports text and image inputs with image output at ~2K resolution across multiple aspect ratios — double...","shortDescription":"Recraft V4.","categories":["image","multimodal"],"inputModalities":["text","image"],"outputModalities":["image"],"contextLength":65536,"supportsReasoning":false,"ranking":63,"createdAt":"2026-05-13T21:23:09.000Z","group":"recraft/recraft-v4.1-utility-pro-20260514","tier":"pro"},{"slug":"recraft/recraft-v4.1-utility","name":"Recraft: Recraft V4.1 Utility","shortName":"Recraft V4.1 Utility","author":"recraft","authorDisplay":"Recraft","description":"Recraft V4.1 Utility is a general-purpose image generation model from Recraft. It supports text and image inputs with image output at ~1K resolution across multiple aspect ratios, with typical generation...","shortDescription":"Recraft V4.","categories":["image","multimodal"],"inputModalities":["text","image"],"outputModalities":["image"],"contextLength":65536,"supportsReasoning":false,"ranking":64,"createdAt":"2026-05-13T21:23:07.000Z","group":"recraft/recraft-v4.1-utility-20260514","tier":"pro"},{"slug":"recraft/recraft-v4.1-pro","name":"Recraft: Recraft V4.1 Pro","shortName":"Recraft V4.1 Pro","author":"recraft","authorDisplay":"Recraft","description":"Recraft V4.1 Pro is an image generation model from Recraft tuned for high aesthetics. It supports text and image inputs with image output at ~2K resolution across multiple aspect ratios...","shortDescription":"Recraft V4.","categories":["image","multimodal"],"inputModalities":["text","image"],"outputModalities":["image"],"contextLength":65536,"supportsReasoning":false,"ranking":65,"createdAt":"2026-05-13T21:23:04.000Z","group":"recraft/recraft-v4.1-pro-20260514","tier":"pro"},{"slug":"recraft/recraft-v4.1","name":"Recraft: Recraft V4.1","shortName":"Recraft V4.1","author":"recraft","authorDisplay":"Recraft","description":"Recraft V4.1 is an image generation model from Recraft tuned for high aesthetics. It supports text and image inputs with image output at ~1K resolution across multiple aspect ratios, with...","shortDescription":"Recraft V4.","categories":["image","multimodal"],"inputModalities":["text","image"],"outputModalities":["image"],"contextLength":65536,"supportsReasoning":false,"ranking":66,"createdAt":"2026-05-13T21:23:01.000Z","group":"recraft/recraft-v4.1-20260514","tier":"pro"},{"slug":"recraft/recraft-v4-pro-vector","name":"Recraft: Recraft V4 Pro Vector","shortName":"Recraft V4 Pro Vector","author":"recraft","authorDisplay":"Recraft","description":"Recraft V4 Pro Vector is the vector (SVG) variant of Recraft V4 Pro. It supports text and image inputs and produces vector image output across multiple aspect ratios at the...","shortDescription":"Recraft V4 Pro Vector is the vector (SVG) variant of Recraft V4 Pro.","categories":["image","multimodal"],"inputModalities":["text","image"],"outputModalities":["image"],"contextLength":65536,"supportsReasoning":false,"ranking":67,"createdAt":"2026-05-13T21:22:14.000Z","group":"recraft/recraft-v4-pro-vector-20260514","tier":"pro"},{"slug":"recraft/recraft-v4-vector","name":"Recraft: Recraft V4 Vector","shortName":"Recraft V4 Vector","author":"recraft","authorDisplay":"Recraft","description":"Recraft V4 Vector is the vector (SVG) variant of Recraft V4. It supports text and image inputs and produces vector image output across multiple aspect ratios. Compared to the raster...","shortDescription":"Recraft V4 Vector is the vector (SVG) variant of Recraft V4.","categories":["image","multimodal"],"inputModalities":["text","image"],"outputModalities":["image"],"contextLength":65536,"supportsReasoning":false,"ranking":68,"createdAt":"2026-05-13T21:22:13.000Z","group":"recraft/recraft-v4-vector-20260514","tier":"pro"},{"slug":"perceptron/perceptron-mk1","name":"Perceptron: Perceptron Mk1","shortName":"Perceptron Mk1","author":"perceptron","authorDisplay":"Perceptron","description":"Perceptron Mk1 (Mark One) is Perceptron's highest-quality vision-language model for video and embodied reasoning.** It accepts image and video inputs paired with natural language queries, and produces detailed visual understanding...","shortDescription":"Perceptron Mk1 (Mark One) is Perceptron's highest-quality vision-language model for video and embodied reasoning.","categories":["text","multimodal","reasoning"],"inputModalities":["text","image","video"],"outputModalities":["text"],"contextLength":32768,"supportsReasoning":true,"ranking":69,"createdAt":"2026-05-12T14:43:49.000Z","group":"perceptron/perceptron-mk1-20260512","tier":"basic"},{"slug":"inclusionai/ring-2.6-1t","name":"inclusionAI: Ring-2.6-1T","shortName":"Ring-2.6-1T","author":"inclusionai","authorDisplay":"Inclusionai","description":"Ring-2.6-1T is a 1T-parameter-scale thinking model with 63B active parameters, built for real-world agent workflows that require both strong capability and operational efficiency. It is optimized for coding agents, tool...","shortDescription":"Ring-2.","categories":["text","reasoning"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":262144,"supportsReasoning":true,"ranking":70,"createdAt":"2026-05-08T13:37:20.000Z","group":"inclusionai/ring-2.6-1t-20260508","tier":"basic"},{"slug":"recraft/recraft-v4-pro","name":"Recraft: Recraft V4 Pro","shortName":"Recraft V4 Pro","author":"recraft","authorDisplay":"Recraft","description":"Recraft V4 Pro is an image generation model from Recraft. It supports text and image inputs with image output at ~2K resolution across multiple aspect ratios, double the resolution of...","shortDescription":"Recraft V4 Pro is an image generation model from Recraft.","categories":["image","multimodal"],"inputModalities":["text","image"],"outputModalities":["image"],"contextLength":65536,"supportsReasoning":false,"ranking":71,"createdAt":"2026-05-07T20:24:01.000Z","group":"recraft/recraft-v4-pro-20260413","tier":"pro"},{"slug":"recraft/recraft-v4","name":"Recraft: Recraft V4","shortName":"Recraft V4","author":"recraft","authorDisplay":"Recraft","description":"Recraft V4 is an image generation model from Recraft. It supports text and image inputs with image output at ~1K resolution across multiple aspect ratios. It delivers stronger compositional judgment,...","shortDescription":"Recraft V4 is an image generation model from Recraft.","categories":["image","multimodal"],"inputModalities":["text","image"],"outputModalities":["image"],"contextLength":65536,"supportsReasoning":false,"ranking":72,"createdAt":"2026-05-07T20:23:57.000Z","group":"recraft/recraft-v4-20260413","tier":"pro"},{"slug":"recraft/recraft-v3","name":"Recraft: Recraft V3","shortName":"Recraft V3","author":"recraft","authorDisplay":"Recraft","description":"Recraft V3 is an image generation model from Recraft. It supports text and image inputs with image output at ~1K resolution across multiple aspect ratios. Supports the following `image_config` parameters:...","shortDescription":"Recraft V3 is an image generation model from Recraft.","categories":["image","multimodal"],"inputModalities":["text","image"],"outputModalities":["image"],"contextLength":65536,"supportsReasoning":false,"ranking":73,"createdAt":"2026-05-07T20:23:53.000Z","group":"recraft/recraft-v3-20260413","tier":"pro"},{"slug":"google/gemini-3.1-flash-lite","name":"Google: Gemini 3.1 Flash Lite","shortName":"Gemini 3.1 Flash Lite","author":"google","authorDisplay":"Google","description":"Gemini 3.1 Flash Lite is Google’s GA high-efficiency multimodal model optimized for low-latency, high-volume workloads. It supports text, image, video, audio, and PDF inputs, and is designed for lightweight agentic...","shortDescription":"Gemini 3.","categories":["text","multimodal","reasoning"],"inputModalities":["text","image","video","file","audio"],"outputModalities":["text"],"contextLength":1048576,"supportsReasoning":true,"ranking":74,"createdAt":"2026-05-07T15:47:08.000Z","group":"google/gemini-3.1-flash-lite-20260507","tier":"basic"},{"slug":"openai/gpt-chat-latest","name":"OpenAI: GPT Chat Latest","shortName":"GPT Chat Latest","author":"openai","authorDisplay":"OpenAI","description":"GPT Chat Latest points to OpenAI's stable API alias `chat-latest` that always resolves to the latest Instant chat model used in ChatGPT. As OpenAI rolls out new Instant model updates...","shortDescription":"GPT Chat Latest points to OpenAI's stable API alias `chat-latest` that always resolves to the latest Instant chat model used in ChatGPT.","categories":["text","multimodal"],"inputModalities":["text","image","file"],"outputModalities":["text"],"contextLength":400000,"supportsReasoning":false,"ranking":75,"createdAt":"2026-05-05T16:56:52.000Z","group":"openai/gpt-chat-latest-20260505","tier":"ultimate"},{"slug":"x-ai/grok-4.3","name":"xAI: Grok 4.3","shortName":"Grok 4.3","author":"x-ai","authorDisplay":"xAI","description":"Grok 4.3 is a reasoning model from xAI. It accepts text and image inputs with text output, and is suited for agentic workflows, instruction-following tasks, and applications requiring high factual...","shortDescription":"Grok 4.","categories":["text","multimodal","reasoning"],"inputModalities":["text","image","file"],"outputModalities":["text"],"contextLength":1000000,"supportsReasoning":true,"ranking":76,"createdAt":"2026-04-30T23:30:21.000Z","group":"x-ai/grok-4.3-20260430","tier":"pro"},{"slug":"ibm-granite/granite-4.1-8b","name":"IBM: Granite 4.1 8B","shortName":"Granite 4.1 8B","author":"ibm-granite","authorDisplay":"Ibm granite","description":"Granite 4.1 8B is a dense, decoder-only 8-billion-parameter language model from IBM, part of the Granite 4.1 family. It supports a 131K-token context window and is designed for enterprise tasks...","shortDescription":"Granite 4.","categories":["text"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":131072,"supportsReasoning":false,"ranking":77,"createdAt":"2026-04-30T19:24:31.000Z","group":"ibm-granite/granite-4.1-8b-20260429","tier":"basic"},{"slug":"mistralai/mistral-medium-3-5","name":"Mistral: Mistral Medium 3.5","shortName":"Mistral Medium 3.5","author":"mistralai","authorDisplay":"Mistral AI","description":"Mistral Medium 3.5 is a dense 128B instruction-following model from Mistral AI. It supports text and image inputs with text output, and is designed for agentic workflows, coding, and complex...","shortDescription":"Mistral Medium 3.","categories":["text","multimodal","reasoning"],"inputModalities":["text","image","file"],"outputModalities":["text"],"contextLength":262144,"supportsReasoning":true,"ranking":78,"createdAt":"2026-04-30T17:33:59.000Z","group":"mistralai/mistral-medium-3.5-20260430","tier":"pro"},{"slug":"kwaivgi/kling-v3.0-pro","name":"Kling: Video v3.0 Pro","shortName":"Video v3.0 Pro","author":"kwaivgi","authorDisplay":"Kwaivgi","description":"Kling v3.0 Pro is Kuaishou's premium video generation model, offering higher visual quality than the Standard tier. It supports text-to-video and image-to-video workflows, with first-frame and last-frame control for precise...","shortDescription":"Kling v3.","categories":["video","multimodal"],"inputModalities":["text","image"],"outputModalities":["video"],"contextLength":0,"supportsReasoning":false,"ranking":79,"createdAt":"2026-04-29T20:56:46.000Z","group":"kwaivgi/kling-v3.0-pro-20260429","tier":"pro"},{"slug":"kwaivgi/kling-v3.0-std","name":"Kling: Video v3.0 Standard","shortName":"Video v3.0 Standard","author":"kwaivgi","authorDisplay":"Kwaivgi","description":"Kling v3.0 Standard is a video generation model from Kuaishou. It supports text-to-video and image-to-video workflows, with first-frame and last-frame control for guided scene composition. Clips range from 3 to...","shortDescription":"Kling v3.","categories":["video","multimodal"],"inputModalities":["text","image"],"outputModalities":["video"],"contextLength":0,"supportsReasoning":false,"ranking":80,"createdAt":"2026-04-29T20:56:45.000Z","group":"kwaivgi/kling-v3.0-std-20260429","tier":"pro"},{"slug":"nvidia/nemotron-3-nano-omni-30b-a3b-reasoning:free","name":"NVIDIA: Nemotron 3 Nano Omni","shortName":"Nemotron 3 Nano Omni","author":"nvidia","authorDisplay":"NVIDIA","description":"NVIDIA Nemotron™ 3 Nano Omni is a 30B-A3B open multimodal model designed to function as a perception and context sub-agent in enterprise agent systems. It accepts text, image, video, and...","shortDescription":"NVIDIA Nemotron™ 3 Nano Omni is a 30B-A3B open multimodal model designed to function as a perception and context sub-agent in enterprise agent systems.","categories":["text","multimodal","reasoning"],"inputModalities":["text","audio","image","video"],"outputModalities":["text"],"contextLength":256000,"supportsReasoning":true,"ranking":81,"createdAt":"2026-04-28T16:18:15.000Z","group":"nvidia/nemotron-3-nano-omni-30b-a3b-reasoning-20260428","tier":"basic"},{"slug":"poolside/laguna-m.1","name":"Poolside: Laguna M.1","shortName":"Laguna M.1","author":"poolside","authorDisplay":"Poolside","description":"Laguna M.1 is the flagship coding agent model from [Poolside](https://poolside.ai/), optimized for complex software engineering tasks. Designed for agentic coding workflows, it supports tool calling and reasoning, with a 256K...","shortDescription":"Laguna M.","categories":["text","reasoning"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":262144,"supportsReasoning":true,"ranking":82,"createdAt":"2026-04-28T15:01:44.000Z","group":"poolside/laguna-m.1-20260312","tier":"basic"},{"slug":"poolside/laguna-m.1:free","name":"Poolside: Laguna M.1","shortName":"Laguna M.1","author":"poolside","authorDisplay":"Poolside","description":"Laguna M.1 is the flagship coding agent model from [Poolside](https://poolside.ai/), optimized for complex software engineering tasks. Designed for agentic coding workflows, it supports tool calling and reasoning, with a 256K...","shortDescription":"Laguna M.","categories":["text","reasoning"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":262144,"supportsReasoning":true,"ranking":83,"createdAt":"2026-04-28T15:01:44.000Z","group":"poolside/laguna-m.1-20260312","tier":"basic"},{"slug":"~anthropic/claude-haiku-latest","name":"Anthropic Claude Haiku Latest","shortName":"Anthropic Claude Haiku Latest","author":"~anthropic","authorDisplay":"~anthropic","description":"This model always redirects to the latest model in the Anthropic Claude Haiku family.","shortDescription":"This model always redirects to the latest model in the Anthropic Claude Haiku family.","categories":["text","multimodal","reasoning"],"inputModalities":["text","image","file"],"outputModalities":["text"],"contextLength":200000,"supportsReasoning":true,"ranking":84,"createdAt":"2026-04-27T19:34:52.000Z","group":"~anthropic/claude-haiku-latest","tier":"pro"},{"slug":"~openai/gpt-mini-latest","name":"OpenAI GPT Mini Latest","shortName":"OpenAI GPT Mini Latest","author":"~openai","authorDisplay":"~openai","description":"This model always redirects to the latest model in the OpenAI GPT Mini family.","shortDescription":"This model always redirects to the latest model in the OpenAI GPT Mini family.","categories":["text","multimodal","reasoning"],"inputModalities":["file","image","text"],"outputModalities":["text"],"contextLength":400000,"supportsReasoning":true,"ranking":85,"createdAt":"2026-04-27T19:34:31.000Z","group":"~openai/gpt-mini-latest","tier":"pro"},{"slug":"~google/gemini-pro-latest","name":"Google Gemini Pro Latest","shortName":"Google Gemini Pro Latest","author":"~google","authorDisplay":"~google","description":"This model always redirects to the latest model in the Google Gemini Pro family.","shortDescription":"This model always redirects to the latest model in the Google Gemini Pro family.","categories":["text","multimodal","reasoning"],"inputModalities":["audio","file","image","text","video"],"outputModalities":["text"],"contextLength":1048576,"supportsReasoning":true,"ranking":86,"createdAt":"2026-04-27T19:34:11.000Z","group":"~google/gemini-pro-latest","tier":"pro"},{"slug":"~moonshotai/kimi-latest","name":"MoonshotAI Kimi Latest","shortName":"MoonshotAI Kimi Latest","author":"~moonshotai","authorDisplay":"~moonshotai","description":"This model always redirects to the latest model in the MoonshotAI Kimi family.","shortDescription":"This model always redirects to the latest model in the MoonshotAI Kimi family.","categories":["text","multimodal","reasoning"],"inputModalities":["text","image"],"outputModalities":["text"],"contextLength":1048576,"supportsReasoning":true,"ranking":87,"createdAt":"2026-04-27T19:33:48.000Z","group":"~moonshotai/kimi-latest","tier":"pro"},{"slug":"~google/gemini-flash-latest","name":"Google Gemini Flash Latest","shortName":"Google Gemini Flash Latest","author":"~google","authorDisplay":"~google","description":"This model always redirects to the latest model in the Google Gemini Flash family.","shortDescription":"This model always redirects to the latest model in the Google Gemini Flash family.","categories":["text","multimodal","reasoning"],"inputModalities":["text","image","video","file","audio"],"outputModalities":["text"],"contextLength":1048576,"supportsReasoning":true,"ranking":88,"createdAt":"2026-04-27T19:33:18.000Z","group":"~google/gemini-flash-latest","tier":"pro"},{"slug":"~anthropic/claude-sonnet-latest","name":"Anthropic Claude Sonnet Latest","shortName":"Anthropic Claude Sonnet Latest","author":"~anthropic","authorDisplay":"~anthropic","description":"This model always redirects to the latest model in the Anthropic Claude Sonnet family.","shortDescription":"This model always redirects to the latest model in the Anthropic Claude Sonnet family.","categories":["text","multimodal","reasoning"],"inputModalities":["text","image","file"],"outputModalities":["text"],"contextLength":1000000,"supportsReasoning":true,"ranking":89,"createdAt":"2026-04-27T19:32:48.000Z","group":"~anthropic/claude-sonnet-latest","tier":"pro"},{"slug":"~openai/gpt-latest","name":"OpenAI GPT Latest","shortName":"OpenAI GPT Latest","author":"~openai","authorDisplay":"~openai","description":"This model always redirects to the latest model in the OpenAI GPT family.","shortDescription":"This model always redirects to the latest model in the OpenAI GPT family.","categories":["text","multimodal","reasoning"],"inputModalities":["file","image","text"],"outputModalities":["text"],"contextLength":1050000,"supportsReasoning":true,"ranking":90,"createdAt":"2026-04-27T19:32:14.000Z","group":"~openai/gpt-latest","tier":"ultimate"},{"slug":"qwen/qwen3.5-plus-20260420","name":"Qwen: Qwen3.5 Plus 2026-04-20","shortName":"Qwen3.5 Plus 2026-04-20","author":"qwen","authorDisplay":"Qwen","description":"Qwen3.5 Plus (April 2026) is a large-scale multimodal language model from Alibaba. It accepts text, image, and video input and produces text output, with a 1M token context window. This...","shortDescription":"Qwen3.","categories":["text","multimodal","reasoning"],"inputModalities":["text","image","video"],"outputModalities":["text"],"contextLength":1000000,"supportsReasoning":true,"ranking":91,"createdAt":"2026-04-27T03:42:48.000Z","group":"qwen/qwen3.5-plus-20260420","tier":"basic"},{"slug":"qwen/qwen3.6-flash","name":"Qwen: Qwen3.6 Flash","shortName":"Qwen3.6 Flash","author":"qwen","authorDisplay":"Qwen","description":"Qwen3.6 Flash is a fast, efficient language model from Alibaba's Qwen 3.6 series. It supports text, image, and video input with a 1M token context window. Tiered pricing kicks in...","shortDescription":"Qwen3.","categories":["text","multimodal","reasoning"],"inputModalities":["text","image","video"],"outputModalities":["text"],"contextLength":1000000,"supportsReasoning":true,"ranking":92,"createdAt":"2026-04-27T03:42:42.000Z","group":"qwen/qwen3.6-flash","tier":"basic"},{"slug":"qwen/qwen3.6-35b-a3b","name":"Qwen: Qwen3.6 35B A3B","shortName":"Qwen3.6 35B A3B","author":"qwen","authorDisplay":"Qwen","description":"Qwen3.6-35B-A3B is an open-weight multimodal model from Alibaba Cloud with 35 billion total parameters and 3 billion active parameters per token. It uses a hybrid sparse mixture-of-experts architecture combining Gated...","shortDescription":"Qwen3.","categories":["text","multimodal","reasoning"],"inputModalities":["text","image","video"],"outputModalities":["text"],"contextLength":262144,"supportsReasoning":true,"ranking":93,"createdAt":"2026-04-27T03:24:15.000Z","group":"qwen/qwen3.6-35b-a3b-20260415","tier":"basic"},{"slug":"qwen/qwen3.6-max-preview","name":"Qwen: Qwen3.6 Max Preview","shortName":"Qwen3.6 Max Preview","author":"qwen","authorDisplay":"Qwen","description":"Qwen3.6-Max-Preview is a proprietary frontier model from Alibaba Cloud built on a sparse mixture-of-experts architecture with approximately 1 trillion total parameters. It is optimized for agentic coding, tool use, and...","shortDescription":"Qwen3.","categories":["text","reasoning"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":262144,"supportsReasoning":true,"ranking":94,"createdAt":"2026-04-27T03:24:02.000Z","group":"qwen/qwen3.6-max-preview-20260420","tier":"pro"},{"slug":"qwen/qwen3.6-27b","name":"Qwen: Qwen3.6 27B","shortName":"Qwen3.6 27B","author":"qwen","authorDisplay":"Qwen","description":"Qwen3.6 27B is a dense 27-billion-parameter language model from the Qwen Team at Alibaba, released in April 2026. It features hybrid multimodal capabilities — accepting text, image, and video inputs...","shortDescription":"Qwen3.","categories":["text","multimodal","reasoning"],"inputModalities":["text","image","video"],"outputModalities":["text"],"contextLength":262144,"supportsReasoning":true,"ranking":95,"createdAt":"2026-04-27T01:57:44.000Z","group":"qwen/qwen3.6-27b-20260422","tier":"basic"},{"slug":"openai/gpt-5.5","name":"OpenAI: GPT-5.5","shortName":"GPT-5.5","author":"openai","authorDisplay":"OpenAI","description":"GPT-5.5 is OpenAI’s frontier model designed for complex professional workloads, building on GPT-5.4 with stronger reasoning, higher reliability, and improved token efficiency on hard tasks. It features a 1M+ token...","shortDescription":"GPT-5.","categories":["text","multimodal","reasoning"],"inputModalities":["file","image","text"],"outputModalities":["text"],"contextLength":1050000,"supportsReasoning":true,"ranking":96,"createdAt":"2026-04-24T17:31:33.000Z","group":"openai/gpt-5.5-20260423","tier":"ultimate"},{"slug":"deepseek/deepseek-v4-pro","name":"DeepSeek: DeepSeek V4 Pro","shortName":"DeepSeek V4 Pro","author":"deepseek","authorDisplay":"DeepSeek","description":"DeepSeek V4 Pro is a large-scale Mixture-of-Experts model from DeepSeek with 1.6T total parameters and 49B activated parameters, supporting a 1M-token context window. It is designed for advanced reasoning, coding,...","shortDescription":"DeepSeek V4 Pro is a large-scale Mixture-of-Experts model from DeepSeek with 1.","categories":["text","reasoning"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":1048576,"supportsReasoning":true,"ranking":97,"createdAt":"2026-04-24T03:17:59.000Z","group":"deepseek/deepseek-v4-pro-20260423","tier":"pro"},{"slug":"deepseek/deepseek-v4-flash","name":"DeepSeek: DeepSeek V4 Flash","shortName":"DeepSeek V4 Flash","author":"deepseek","authorDisplay":"DeepSeek","description":"DeepSeek V4 Flash is an efficiency-optimized Mixture-of-Experts model from DeepSeek with 284B total parameters and 13B activated parameters, supporting a 1M-token context window. It is designed for fast inference and...","shortDescription":"DeepSeek V4 Flash is an efficiency-optimized Mixture-of-Experts model from DeepSeek with 284B total parameters and 13B activated parameters, supporting a 1M-...","categories":["text","reasoning"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":1048576,"supportsReasoning":true,"ranking":98,"createdAt":"2026-04-24T03:17:46.000Z","group":"deepseek/deepseek-v4-flash-20260423","tier":"basic"},{"slug":"google/veo-3.1-fast","name":"Google: Veo 3.1 Fast","shortName":"Veo 3.1 Fast","author":"google","authorDisplay":"Google","description":"Google's mid-tier video generation model balancing speed and quality. Veo 3.1 Fast generates high-quality video from text or image prompts with native synchronized audio, offering faster turnaround than Veo 3.1...","shortDescription":"Google's mid-tier video generation model balancing speed and quality.","categories":["video","multimodal"],"inputModalities":["text","image"],"outputModalities":["video"],"contextLength":0,"supportsReasoning":false,"ranking":99,"createdAt":"2026-04-24T01:37:46.000Z","group":"google/veo-3.1-fast-20260320","tier":"pro"},{"slug":"google/veo-3.1-lite","name":"Google: Veo 3.1 Lite","shortName":"Veo 3.1 Lite","author":"google","authorDisplay":"Google","description":"Google's most cost-effective video generation model, designed for high-volume applications and rapid iteration. Veo 3.1 Lite generates 720p and 1080p video from text or image prompts with native synchronized audio...","shortDescription":"Google's most cost-effective video generation model, designed for high-volume applications and rapid iteration.","categories":["video","multimodal"],"inputModalities":["text","image"],"outputModalities":["video"],"contextLength":0,"supportsReasoning":false,"ranking":100,"createdAt":"2026-04-23T21:13:38.000Z","group":"google/veo-3.1-lite-20260331","tier":"pro"},{"slug":"inclusionai/ling-2.6-1t","name":"inclusionAI: Ling-2.6-1T","shortName":"Ling-2.6-1T","author":"inclusionai","authorDisplay":"Inclusionai","description":"Ling-2.6-1T is an instant (instruct) model from inclusionAI and the company’s trillion-parameter flagship, designed for real-world agents that require fast execution and high efficiency at scale. It uses a “fast...","shortDescription":"Ling-2.","categories":["text"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":262144,"supportsReasoning":false,"ranking":101,"createdAt":"2026-04-23T12:43:58.000Z","group":"inclusionai/ling-2.6-1t-20260423","tier":"basic"},{"slug":"tencent/hy3-preview","name":"Tencent: Hy3 preview","shortName":"Hy3 preview","author":"tencent","authorDisplay":"Tencent","description":"Hy3 preview is a high-efficiency Mixture-of-Experts model from Tencent designed for agentic workflows and production use. It supports configurable reasoning levels across disabled, low, and high modes, allowing it to...","shortDescription":"Hy3 preview is a high-efficiency Mixture-of-Experts model from Tencent designed for agentic workflows and production use.","categories":["text","reasoning"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":262144,"supportsReasoning":true,"ranking":102,"createdAt":"2026-04-22T17:15:50.000Z","group":"tencent/hy3-preview-20260421","tier":"basic"},{"slug":"xiaomi/mimo-v2.5-pro","name":"Xiaomi: MiMo-V2.5-Pro","shortName":"MiMo-V2.5-Pro","author":"xiaomi","authorDisplay":"Xiaomi","description":"MiMo-V2.5-Pro is Xiaomi’s flagship model, delivering strong performance in general agentic capabilities, complex software engineering, and long-horizon tasks, with top rankings on benchmarks such as ClawEval, GDPVal, and SWE-bench Pro....","shortDescription":"MiMo-V2.","categories":["text","reasoning"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":1050000,"supportsReasoning":true,"ranking":103,"createdAt":"2026-04-22T16:11:13.000Z","group":"xiaomi/mimo-v2.5-pro-20260422","tier":"pro"},{"slug":"xiaomi/mimo-v2.5","name":"Xiaomi: MiMo-V2.5","shortName":"MiMo-V2.5","author":"xiaomi","authorDisplay":"Xiaomi","description":"MiMo-V2.5 is a native omnimodal model by Xiaomi. It delivers Pro-level agentic performance at roughly half the inference cost, while surpassing MiMo-V2-Omni in multimodal perception across image and video understanding...","shortDescription":"MiMo-V2.","categories":["text","multimodal","reasoning"],"inputModalities":["text","audio","image","video"],"outputModalities":["text"],"contextLength":1050000,"supportsReasoning":true,"ranking":104,"createdAt":"2026-04-22T16:11:09.000Z","group":"xiaomi/mimo-v2.5-20260422","tier":"basic"},{"slug":"inclusionai/ling-2.6-flash","name":"inclusionAI: Ling-2.6-flash","shortName":"Ling-2.6-flash","author":"inclusionai","authorDisplay":"Inclusionai","description":"Ling-2.6-flash is an instant (instruct) model from inclusionAI with 104B total parameters and 7.4B active parameters, designed for real-world agents that require fast responses, strong execution, and high token efficiency....","shortDescription":"Ling-2.","categories":["text"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":262144,"supportsReasoning":false,"ranking":105,"createdAt":"2026-04-21T18:24:46.000Z","group":"inclusionai/ling-2.6-flash-20260421","tier":"basic"},{"slug":"~anthropic/claude-opus-latest","name":"Anthropic: Claude Opus Latest","shortName":"Claude Opus Latest","author":"~anthropic","authorDisplay":"~anthropic","description":"This model always redirects to the latest model in the Claude Opus family.","shortDescription":"This model always redirects to the latest model in the Claude Opus family.","categories":["text","multimodal","reasoning"],"inputModalities":["text","image","file"],"outputModalities":["text"],"contextLength":1000000,"supportsReasoning":true,"ranking":106,"createdAt":"2026-04-21T18:16:01.000Z","group":"~anthropic/claude-opus-latest","tier":"ultimate"},{"slug":"openrouter/pareto-code","name":"Pareto Code Router","shortName":"Pareto Code Router","author":"openrouter","authorDisplay":"Openrouter","description":"The Pareto Router maintains a tiered shortlist of strong coding models, ranked by [Artificial Analysis](https://artificialanalysis.ai/) coding percentiles. Set min_coding_score between 0 and 1 on the [pareto-router plugin](https://openrouter.ai/docs/guides/routing/routers/pareto-router#the-min_coding_score-parameter) to control how...","shortDescription":"The Pareto Router maintains a tiered shortlist of strong coding models, ranked by [Artificial Analysis](https://artificialanalysis.","categories":["text","coding"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":2000000,"supportsReasoning":false,"ranking":107,"createdAt":"2026-04-21T05:05:00.000Z","group":"openrouter/pareto-code","tier":"basic"},{"slug":"kwaivgi/kling-video-o1","name":"Kling: Video O1","shortName":"Video O1","author":"kwaivgi","authorDisplay":"Kwaivgi","description":"Kling Video O1 is a video generation model from Kuaishou. It supports text and image inputs with video output, enabling text-to-video and image-to-video workflows. It is suited for cinematic content...","shortDescription":"Kling Video O1 is a video generation model from Kuaishou.","categories":["video","multimodal"],"inputModalities":["text","image"],"outputModalities":["video"],"contextLength":0,"supportsReasoning":false,"ranking":108,"createdAt":"2026-04-20T17:06:17.000Z","group":"kwaivgi/kling-video-o1-20260420","tier":"pro"},{"slug":"minimax/hailuo-2.3","name":"MiniMax: Hailuo 2.3","shortName":"Hailuo 2.3","author":"minimax","authorDisplay":"Minimax","description":"Hailuo 2.3 is a video generation model from MiniMax. It accepts text prompts and reference images as input and generates video output, supporting both text-to-video and image-to-video workflows. It is...","shortDescription":"Hailuo 2.","categories":["video","multimodal"],"inputModalities":["text","image"],"outputModalities":["video"],"contextLength":0,"supportsReasoning":false,"ranking":109,"createdAt":"2026-04-20T16:32:20.000Z","group":"minimax/hailuo-2.3-20260420","tier":"pro"},{"slug":"moonshotai/kimi-k2.6","name":"MoonshotAI: Kimi K2.6","shortName":"Kimi K2.6","author":"moonshotai","authorDisplay":"Moonshotai","description":"Kimi K2.6 is Moonshot AI's next-generation multimodal model, designed for long-horizon coding, coding-driven UI/UX generation, and multi-agent orchestration. It handles complex end-to-end coding tasks across Python, Rust, and Go, and...","shortDescription":"Kimi K2.","categories":["text","multimodal","reasoning"],"inputModalities":["text","image"],"outputModalities":["text"],"contextLength":262144,"supportsReasoning":true,"ranking":110,"createdAt":"2026-04-20T15:36:42.000Z","group":"moonshotai/kimi-k2.6-20260420","tier":"pro"},{"slug":"anthropic/claude-opus-4.7","name":"Anthropic: Claude Opus 4.7","shortName":"Claude Opus 4.7","author":"anthropic","authorDisplay":"Anthropic","description":"Opus 4.7 is the next generation of Anthropic's Opus family, built for long-running, asynchronous agents. Building on the coding and agentic strengths of Opus 4.6, it delivers stronger performance on...","shortDescription":"Opus 4.","categories":["text","multimodal","reasoning"],"inputModalities":["text","image","file"],"outputModalities":["text"],"contextLength":1000000,"supportsReasoning":true,"ranking":111,"createdAt":"2026-04-16T14:51:40.000Z","group":"anthropic/claude-4.7-opus-20260416","tier":"ultimate"},{"slug":"alibaba/wan-2.7","name":"Alibaba: Wan 2.7","shortName":"Wan 2.7","author":"alibaba","authorDisplay":"Alibaba","description":"Wan 2.7 is a video generation model from Alibaba. It supports text-to-video, image-to-video with first and last frame control, and reference-to-video, where multiple reference images guide the style and content...","shortDescription":"Wan 2.","categories":["video","multimodal"],"inputModalities":["text","image"],"outputModalities":["video"],"contextLength":0,"supportsReasoning":false,"ranking":112,"createdAt":"2026-04-15T00:02:42.000Z","group":"alibaba/wan-2.7-20260414","tier":"pro"},{"slug":"bytedance/seedance-2.0","name":"ByteDance: Seedance 2.0","shortName":"Seedance 2.0","author":"bytedance","authorDisplay":"ByteDance","description":"Seedance 2.0 is a video generation model from ByteDance. It supports text-to-video, image-to-video with first and last frame control, and multimodal reference-to-video. It is particularly strong at preserving character consistency,...","shortDescription":"Seedance 2.","categories":["video","multimodal"],"inputModalities":["text","image","video","audio"],"outputModalities":["video"],"contextLength":0,"supportsReasoning":false,"ranking":113,"createdAt":"2026-04-15T00:02:42.000Z","group":"bytedance/seedance-2.0-20260414","tier":"pro"},{"slug":"bytedance/seedance-2.0-fast","name":"ByteDance: Seedance 2.0 Fast","shortName":"Seedance 2.0 Fast","author":"bytedance","authorDisplay":"ByteDance","description":"Seedance 2.0 Fast is a video generation model from ByteDance. It supports text-to-video, image-to-video with first and last frame control, and multimodal reference-to-video. It prioritizes generation speed and lower cost...","shortDescription":"Seedance 2.","categories":["video","multimodal"],"inputModalities":["text","image","video","audio"],"outputModalities":["video"],"contextLength":0,"supportsReasoning":false,"ranking":114,"createdAt":"2026-04-15T00:02:42.000Z","group":"bytedance/seedance-2.0-fast-20260414","tier":"pro"},{"slug":"z-ai/glm-5.1","name":"Z.ai: GLM 5.1","shortName":"GLM 5.1","author":"z-ai","authorDisplay":"Z ai","description":"GLM-5.1 delivers a major leap in coding capability, with particularly significant gains in handling long-horizon tasks. Unlike previous models built around minute-level interactions, GLM-5.1 can work independently and continuously on...","shortDescription":"GLM-5.","categories":["text","reasoning"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":204800,"supportsReasoning":true,"ranking":115,"createdAt":"2026-04-07T16:07:05.000Z","group":"z-ai/glm-5.1-20260406","tier":"pro"},{"slug":"google/gemma-4-26b-a4b-it","name":"Google: Gemma 4 26B A4B","shortName":"Gemma 4 26B A4B","author":"google","authorDisplay":"Google","description":"Gemma 4 26B A4B IT is an instruction-tuned Mixture-of-Experts (MoE) model from Google DeepMind. Despite 25.2B total parameters, only 3.8B activate per token during inference — delivering near-31B quality at...","shortDescription":"Gemma 4 26B A4B IT is an instruction-tuned Mixture-of-Experts (MoE) model from Google DeepMind.","categories":["text","multimodal","reasoning"],"inputModalities":["image","text","video"],"outputModalities":["text"],"contextLength":262144,"supportsReasoning":true,"ranking":116,"createdAt":"2026-04-03T14:53:09.000Z","group":"google/gemma-4-26b-a4b-it-20260403","tier":"basic"},{"slug":"google/gemma-4-26b-a4b-it:free","name":"Google: Gemma 4 26B A4B","shortName":"Gemma 4 26B A4B","author":"google","authorDisplay":"Google","description":"Gemma 4 26B A4B IT is an instruction-tuned Mixture-of-Experts (MoE) model from Google DeepMind. Despite 25.2B total parameters, only 3.8B activate per token during inference — delivering near-31B quality at...","shortDescription":"Gemma 4 26B A4B IT is an instruction-tuned Mixture-of-Experts (MoE) model from Google DeepMind.","categories":["text","multimodal","reasoning"],"inputModalities":["image","text","video"],"outputModalities":["text"],"contextLength":262144,"supportsReasoning":true,"ranking":117,"createdAt":"2026-04-03T14:53:09.000Z","group":"google/gemma-4-26b-a4b-it-20260403","tier":"basic"},{"slug":"google/gemma-4-31b-it","name":"Google: Gemma 4 31B","shortName":"Gemma 4 31B","author":"google","authorDisplay":"Google","description":"Gemma 4 31B Instruct is Google DeepMind's 30.7B dense multimodal model supporting text and image input with text output. Features a 256K token context window, configurable thinking/reasoning mode, native function...","shortDescription":"Gemma 4 31B Instruct is Google DeepMind's 30.","categories":["text","multimodal","reasoning"],"inputModalities":["image","text","video"],"outputModalities":["text"],"contextLength":262144,"supportsReasoning":true,"ranking":118,"createdAt":"2026-04-02T16:48:06.000Z","group":"google/gemma-4-31b-it-20260402","tier":"basic"},{"slug":"google/gemma-4-31b-it:free","name":"Google: Gemma 4 31B","shortName":"Gemma 4 31B","author":"google","authorDisplay":"Google","description":"Gemma 4 31B Instruct is Google DeepMind's 30.7B dense multimodal model supporting text and image input with text output. Features a 256K token context window, configurable thinking/reasoning mode, native function...","shortDescription":"Gemma 4 31B Instruct is Google DeepMind's 30.","categories":["text","multimodal","reasoning"],"inputModalities":["image","text","video"],"outputModalities":["text"],"contextLength":262144,"supportsReasoning":true,"ranking":119,"createdAt":"2026-04-02T16:48:06.000Z","group":"google/gemma-4-31b-it-20260402","tier":"basic"},{"slug":"qwen/qwen3.6-plus","name":"Qwen: Qwen3.6 Plus","shortName":"Qwen3.6 Plus","author":"qwen","authorDisplay":"Qwen","description":"Qwen 3.6 Plus builds on a hybrid architecture that combines efficient linear attention with sparse mixture-of-experts routing, enabling strong scalability and high-performance inference. Compared to the 3.5 series, it delivers...","shortDescription":"Qwen 3.","categories":["text","multimodal","reasoning"],"inputModalities":["text","image","video"],"outputModalities":["text"],"contextLength":1000000,"supportsReasoning":true,"ranking":120,"createdAt":"2026-04-02T12:39:17.000Z","group":"qwen/qwen3.6-plus-04-02","tier":"pro"},{"slug":"z-ai/glm-5v-turbo","name":"Z.ai: GLM 5V Turbo","shortName":"GLM 5V Turbo","author":"z-ai","authorDisplay":"Z ai","description":"GLM-5V-Turbo is Z.ai’s first native multimodal agent foundation model, built for vision-based coding and agent-driven tasks. It natively handles image, video, and text inputs, excels at long-horizon planning, complex coding,...","shortDescription":"GLM-5V-Turbo is Z.","categories":["text","multimodal","reasoning"],"inputModalities":["image","text","video"],"outputModalities":["text"],"contextLength":202752,"supportsReasoning":true,"ranking":121,"createdAt":"2026-04-01T16:37:38.000Z","group":"z-ai/glm-5v-turbo-20260401","tier":"pro"},{"slug":"arcee-ai/trinity-large-thinking","name":"Arcee AI: Trinity Large Thinking","shortName":"Trinity Large Thinking","author":"arcee-ai","authorDisplay":"Arcee ai","description":"Trinity Large Thinking is a powerful open source reasoning model from the team at Arcee AI. It shows strong performance in PinchBench, agentic workloads, and reasoning tasks. Launch video: https://youtu.be/Gc82AXLa0Rg?si=4RLn6WBz33qT--B7...","shortDescription":"Trinity Large Thinking is a powerful open source reasoning model from the team at Arcee AI.","categories":["text","reasoning"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":262144,"supportsReasoning":true,"ranking":122,"createdAt":"2026-04-01T15:45:18.000Z","group":"arcee-ai/trinity-large-thinking","tier":"basic"},{"slug":"x-ai/grok-4.20-multi-agent","name":"xAI: Grok 4.20 Multi-Agent","shortName":"Grok 4.20 Multi-Agent","author":"x-ai","authorDisplay":"xAI","description":"Grok 4.20 Multi-Agent is a variant of xAI’s Grok 4.20 designed for collaborative, agent-based workflows. Multiple agents operate in parallel to conduct deep research, coordinate tool use, and synthesize information...","shortDescription":"Grok 4.","categories":["text","multimodal","reasoning"],"inputModalities":["text","image","file"],"outputModalities":["text"],"contextLength":2000000,"supportsReasoning":true,"ranking":123,"createdAt":"2026-03-31T17:45:58.000Z","group":"x-ai/grok-4.20-multi-agent-20260309","tier":"pro"},{"slug":"x-ai/grok-4.20","name":"xAI: Grok 4.20","shortName":"Grok 4.20","author":"x-ai","authorDisplay":"xAI","description":"Grok 4.20 is a reasoning model from xAI with industry-leading speed and agentic tool calling capabilities. It combines the lowest hallucination rate on the market with strict prompt adherance, delivering...","shortDescription":"Grok 4.","categories":["text","multimodal","reasoning"],"inputModalities":["text","image","file"],"outputModalities":["text"],"contextLength":2000000,"supportsReasoning":true,"ranking":124,"createdAt":"2026-03-31T17:43:39.000Z","group":"x-ai/grok-4.20-20260309","tier":"pro"},{"slug":"google/lyria-3-pro-preview","name":"Google: Lyria 3 Pro Preview","shortName":"Lyria 3 Pro Preview","author":"google","authorDisplay":"Google","description":"Full-length songs are priced at $0.08 per song. Lyria 3 is Google's family of music generation models, available through the Gemini API. With Lyria 3, you can generate high-quality, 48kHz...","shortDescription":"Full-length songs are priced at $0.","categories":["text","multimodal"],"inputModalities":["text","image"],"outputModalities":["text","audio"],"contextLength":1048576,"supportsReasoning":false,"ranking":125,"createdAt":"2026-03-30T21:48:06.000Z","group":"google/lyria-3-pro-preview-20260330","tier":"basic"},{"slug":"google/lyria-3-clip-preview","name":"Google: Lyria 3 Clip Preview","shortName":"Lyria 3 Clip Preview","author":"google","authorDisplay":"Google","description":"30 second duration clips are priced at $0.04 per clip. Lyria 3 is Google's family of music generation models, available through the Gemini API. With Lyria 3, you can generate...","shortDescription":"30 second duration clips are priced at $0.","categories":["text","multimodal"],"inputModalities":["text","image"],"outputModalities":["text","audio"],"contextLength":1048576,"supportsReasoning":false,"ranking":126,"createdAt":"2026-03-30T21:47:35.000Z","group":"google/lyria-3-clip-preview-20260330","tier":"basic"},{"slug":"alibaba/wan-2.6","name":"Alibaba: Wan 2.6","shortName":"Wan 2.6","author":"alibaba","authorDisplay":"Alibaba","description":"Alibaba's most advanced video generation model, supporting over 10 visual creation capabilities in a unified system. Wan 2.6 generates 1080p video at 24fps from text, images, reference videos, or audio,...","shortDescription":"Alibaba's most advanced video generation model, supporting over 10 visual creation capabilities in a unified system.","categories":["video","multimodal"],"inputModalities":["text","image"],"outputModalities":["video"],"contextLength":0,"supportsReasoning":false,"ranking":127,"createdAt":"2026-03-28T00:53:10.000Z","group":"alibaba/wan-2.6-20260327","tier":"pro"},{"slug":"kwaipilot/kat-coder-pro-v2","name":"Kwaipilot: KAT-Coder-Pro V2","shortName":"KAT-Coder-Pro V2","author":"kwaipilot","authorDisplay":"Kwaipilot","description":"KAT-Coder-Pro V2 is the latest high-performance model in KwaiKAT’s KAT-Coder series, designed for complex enterprise-grade software engineering and SaaS integration. It builds on the agentic coding strengths of earlier versions,...","shortDescription":"KAT-Coder-Pro V2 is the latest high-performance model in KwaiKAT’s KAT-Coder series, designed for complex enterprise-grade software engineering and SaaS inte...","categories":["text","coding"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":262144,"supportsReasoning":false,"ranking":128,"createdAt":"2026-03-27T22:08:30.000Z","group":"kwaipilot/kat-coder-pro-v2-20260327","tier":"basic"},{"slug":"bytedance/seedance-1-5-pro","name":"ByteDance: Seedance 1.5 Pro","shortName":"Seedance 1.5 Pro","author":"bytedance","authorDisplay":"ByteDance","description":"ByteDance's next-generation audio-visual generation model with a 4.5B parameter Dual-Branch Diffusion Transformer architecture. Seedance 1.5 Pro generates video and audio simultaneously in a single unified pass — eliminating the timing...","shortDescription":"ByteDance's next-generation audio-visual generation model with a 4.","categories":["video","multimodal"],"inputModalities":["text","image"],"outputModalities":["video"],"contextLength":0,"supportsReasoning":false,"ranking":129,"createdAt":"2026-03-23T14:53:28.000Z","group":"bytedance/seedance-1-5-pro-20260320","tier":"pro"},{"slug":"openai/sora-2-pro","name":"OpenAI: Sora 2 Pro","shortName":"Sora 2 Pro","author":"openai","authorDisplay":"OpenAI","description":"OpenAI's flagship video generation model, delivering production-quality video with physics-accurate motion, synchronized audio, and world-state persistence across shots. Sora 2 Pro follows intricate multi-shot instructions while maintaining consistent spatial relationships...","shortDescription":"OpenAI's flagship video generation model, delivering production-quality video with physics-accurate motion, synchronized audio, and world-state persistence a...","categories":["video","multimodal"],"inputModalities":["text","image"],"outputModalities":["video"],"contextLength":0,"supportsReasoning":false,"ranking":130,"createdAt":"2026-03-23T14:52:01.000Z","group":"openai/sora-2-pro-20260320","tier":"pro"},{"slug":"google/veo-3.1","name":"Google: Veo 3.1","shortName":"Veo 3.1","author":"google","authorDisplay":"Google","description":"Google's state-of-the-art video generation model, built for maximum visual fidelity in final production cuts. Veo 3.1 generates high-quality 1080p video from text or image prompts with native synchronized audio —...","shortDescription":"Google's state-of-the-art video generation model, built for maximum visual fidelity in final production cuts.","categories":["video","multimodal"],"inputModalities":["text","image"],"outputModalities":["video"],"contextLength":0,"supportsReasoning":false,"ranking":131,"createdAt":"2026-03-23T14:45:48.000Z","group":"google/veo-3.1-20260320","tier":"pro"},{"slug":"rekaai/reka-edge","name":"Reka Edge","shortName":"Reka Edge","author":"rekaai","authorDisplay":"Rekaai","description":"Reka Edge is an extremely efficient 7B multimodal vision-language model that accepts image/video+text inputs and generates text outputs. This model is optimized specifically to deliver industry-leading performance in image understanding,...","shortDescription":"Reka Edge is an extremely efficient 7B multimodal vision-language model that accepts image/video+text inputs and generates text outputs.","categories":["text","multimodal","reasoning"],"inputModalities":["image","text","video"],"outputModalities":["text"],"contextLength":16384,"supportsReasoning":true,"ranking":132,"createdAt":"2026-03-20T17:16:05.000Z","group":"rekaai/reka-edge-2603","tier":"basic"},{"slug":"minimax/minimax-m2.7","name":"MiniMax: MiniMax M2.7","shortName":"MiniMax M2.7","author":"minimax","authorDisplay":"Minimax","description":"MiniMax-M2.7 is a next-generation large language model designed for autonomous, real-world productivity and continuous improvement. Built to actively participate in its own evolution, M2.7 integrates advanced agentic capabilities through multi-agent...","shortDescription":"MiniMax-M2.","categories":["text","reasoning"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":204800,"supportsReasoning":true,"ranking":133,"createdAt":"2026-03-18T12:24:57.000Z","group":"minimax/minimax-m2.7-20260318","tier":"basic"},{"slug":"openai/gpt-5.4-nano","name":"OpenAI: GPT-5.4 Nano","shortName":"GPT-5.4 Nano","author":"openai","authorDisplay":"OpenAI","description":"GPT-5.4 nano is the most lightweight and cost-efficient variant of the GPT-5.4 family, optimized for speed-critical and high-volume tasks. It supports text and image inputs and is designed for low-latency...","shortDescription":"GPT-5.","categories":["text","multimodal","reasoning"],"inputModalities":["file","image","text"],"outputModalities":["text"],"contextLength":400000,"supportsReasoning":true,"ranking":134,"createdAt":"2026-03-17T11:49:47.000Z","group":"openai/gpt-5.4-nano-20260317","tier":"basic"},{"slug":"openai/gpt-5.4-mini","name":"OpenAI: GPT-5.4 Mini","shortName":"GPT-5.4 Mini","author":"openai","authorDisplay":"OpenAI","description":"GPT-5.4 mini brings the core capabilities of GPT-5.4 to a faster, more efficient model optimized for high-throughput workloads. It supports text and image inputs with strong performance across reasoning, coding,...","shortDescription":"GPT-5.","categories":["text","multimodal","reasoning"],"inputModalities":["file","image","text"],"outputModalities":["text"],"contextLength":400000,"supportsReasoning":true,"ranking":135,"createdAt":"2026-03-17T11:49:38.000Z","group":"openai/gpt-5.4-mini-20260317","tier":"pro"},{"slug":"mistralai/mistral-small-2603","name":"Mistral: Mistral Small 4","shortName":"Mistral Small 4","author":"mistralai","authorDisplay":"Mistral AI","description":"Mistral Small 4 is the next major release in the Mistral Small family, unifying the capabilities of several flagship Mistral models into a single system. It combines strong reasoning from...","shortDescription":"Mistral Small 4 is the next major release in the Mistral Small family, unifying the capabilities of several flagship Mistral models into a single system.","categories":["text","multimodal","reasoning"],"inputModalities":["text","image"],"outputModalities":["text"],"contextLength":262144,"supportsReasoning":true,"ranking":136,"createdAt":"2026-03-16T21:14:45.000Z","group":"mistralai/mistral-small-2603","tier":"basic"},{"slug":"z-ai/glm-5-turbo","name":"Z.ai: GLM 5 Turbo","shortName":"GLM 5 Turbo","author":"z-ai","authorDisplay":"Z ai","description":"GLM-5 Turbo is a new model from Z.ai designed for fast inference and strong performance in agent-driven environments such as OpenClaw scenarios. It is deeply optimized for real-world agent workflows...","shortDescription":"GLM-5 Turbo is a new model from Z.","categories":["text","reasoning"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":202752,"supportsReasoning":true,"ranking":137,"createdAt":"2026-03-15T14:06:13.000Z","group":"z-ai/glm-5-turbo-20260315","tier":"pro"},{"slug":"nvidia/nemotron-3-super-120b-a12b","name":"NVIDIA: Nemotron 3 Super","shortName":"Nemotron 3 Super","author":"nvidia","authorDisplay":"NVIDIA","description":"NVIDIA Nemotron 3 Super is a 120B-parameter open hybrid MoE model, activating just 12B parameters for maximum compute efficiency and accuracy in complex multi-agent applications. Built on a hybrid Mamba-Transformer...","shortDescription":"NVIDIA Nemotron 3 Super is a 120B-parameter open hybrid MoE model, activating just 12B parameters for maximum compute efficiency and accuracy in complex mult...","categories":["text","reasoning"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":1000000,"supportsReasoning":true,"ranking":138,"createdAt":"2026-03-11T16:07:19.000Z","group":"nvidia/nemotron-3-super-120b-a12b-20230311","tier":"basic"},{"slug":"nvidia/nemotron-3-super-120b-a12b:free","name":"NVIDIA: Nemotron 3 Super","shortName":"Nemotron 3 Super","author":"nvidia","authorDisplay":"NVIDIA","description":"NVIDIA Nemotron 3 Super is a 120B-parameter open hybrid MoE model, activating just 12B parameters for maximum compute efficiency and accuracy in complex multi-agent applications. Built on a hybrid Mamba-Transformer...","shortDescription":"NVIDIA Nemotron 3 Super is a 120B-parameter open hybrid MoE model, activating just 12B parameters for maximum compute efficiency and accuracy in complex mult...","categories":["text","reasoning"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":262144,"supportsReasoning":true,"ranking":139,"createdAt":"2026-03-11T16:07:19.000Z","group":"nvidia/nemotron-3-super-120b-a12b-20230311","tier":"basic"},{"slug":"bytedance-seed/seed-2.0-lite","name":"ByteDance Seed: Seed-2.0-Lite","shortName":"Seed-2.0-Lite","author":"bytedance-seed","authorDisplay":"ByteDance","description":"Seed-2.0-Lite is a versatile, cost‑efficient enterprise workhorse that delivers strong multimodal and agent capabilities while offering noticeably lower latency, making it a practical default choice for most production workloads across...","shortDescription":"Seed-2.","categories":["text","multimodal","reasoning"],"inputModalities":["text","image","video"],"outputModalities":["text"],"contextLength":262144,"supportsReasoning":true,"ranking":140,"createdAt":"2026-03-10T15:40:31.000Z","group":"bytedance-seed/seed-2.0-lite-20260309","tier":"basic"},{"slug":"qwen/qwen3.5-9b","name":"Qwen: Qwen3.5-9B","shortName":"Qwen3.5-9B","author":"qwen","authorDisplay":"Qwen","description":"Qwen3.5-9B is a multimodal foundation model from the Qwen3.5 family, designed to deliver strong reasoning, coding, and visual understanding in an efficient 9B-parameter architecture. It uses a unified vision-language design...","shortDescription":"Qwen3.","categories":["text","multimodal","reasoning"],"inputModalities":["text","image","video"],"outputModalities":["text"],"contextLength":262144,"supportsReasoning":true,"ranking":141,"createdAt":"2026-03-10T14:19:56.000Z","group":"qwen/qwen3.5-9b-20260310","tier":"basic"},{"slug":"openai/gpt-5.4","name":"OpenAI: GPT-5.4","shortName":"GPT-5.4","author":"openai","authorDisplay":"OpenAI","description":"GPT-5.4 is OpenAI’s latest frontier model, unifying the Codex and GPT lines into a single system. It features a 1M+ token context window (922K input, 128K output) with support for...","shortDescription":"GPT-5.","categories":["text","multimodal","reasoning"],"inputModalities":["text","image","file"],"outputModalities":["text"],"contextLength":1050000,"supportsReasoning":true,"ranking":142,"createdAt":"2026-03-05T18:12:32.000Z","group":"openai/gpt-5.4-20260305","tier":"pro"},{"slug":"inception/mercury-2","name":"Inception: Mercury 2","shortName":"Mercury 2","author":"inception","authorDisplay":"Inception","description":"Mercury 2 is an extremely fast reasoning LLM, and the first reasoning diffusion LLM (dLLM). Instead of generating tokens sequentially, Mercury 2 produces and refines multiple tokens in parallel, achieving...","shortDescription":"Mercury 2 is an extremely fast reasoning LLM, and the first reasoning diffusion LLM (dLLM).","categories":["text","reasoning"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":128000,"supportsReasoning":true,"ranking":143,"createdAt":"2026-03-04T14:57:55.000Z","group":"inception/mercury-2-20260304","tier":"basic"},{"slug":"openai/gpt-5.3-chat","name":"OpenAI: GPT-5.3 Chat","shortName":"GPT-5.3 Chat","author":"openai","authorDisplay":"OpenAI","description":"GPT-5.3 Chat is an update to ChatGPT's most-used model that makes everyday conversations smoother, more useful, and more directly helpful. It delivers more accurate answers with better contextualization and significantly...","shortDescription":"GPT-5.","categories":["text","multimodal"],"inputModalities":["text","image","file"],"outputModalities":["text"],"contextLength":128000,"supportsReasoning":false,"ranking":144,"createdAt":"2026-03-03T18:54:21.000Z","group":"openai/gpt-5.3-chat-20260303","tier":"pro"},{"slug":"google/gemini-3.1-flash-lite-preview","name":"Google: Gemini 3.1 Flash Lite Preview","shortName":"Gemini 3.1 Flash Lite Preview","author":"google","authorDisplay":"Google","description":"Gemini 3.1 Flash Lite Preview is Google's high-efficiency model optimized for high-volume use cases. It outperforms Gemini 2.5 Flash Lite on overall quality and approaches Gemini 2.5 Flash performance across...","shortDescription":"Gemini 3.","categories":["text","multimodal","reasoning"],"inputModalities":["text","image","video","file","audio"],"outputModalities":["text"],"contextLength":1048576,"supportsReasoning":true,"ranking":145,"createdAt":"2026-03-03T04:37:53.000Z","group":"google/gemini-3.1-flash-lite-preview-20260303","tier":"basic"},{"slug":"bytedance-seed/seed-2.0-mini","name":"ByteDance Seed: Seed-2.0-Mini","shortName":"Seed-2.0-Mini","author":"bytedance-seed","authorDisplay":"ByteDance","description":"Seed-2.0-mini targets latency-sensitive, high-concurrency, and cost-sensitive scenarios, emphasizing fast response and flexible inference deployment. It delivers performance comparable to ByteDance-Seed-1.6, supports 256k context, four reasoning effort modes (minimal/low/medium/high), multimodal understanding,...","shortDescription":"Seed-2.","categories":["text","multimodal","reasoning"],"inputModalities":["text","image","video"],"outputModalities":["text"],"contextLength":262144,"supportsReasoning":true,"ranking":146,"createdAt":"2026-02-26T18:38:27.000Z","group":"bytedance-seed/seed-2.0-mini-20260224","tier":"basic"},{"slug":"google/gemini-3.1-flash-image-preview","name":"Google: Nano Banana 2 (Gemini 3.1 Flash Image Preview)","shortName":"Nano Banana 2 (Gemini 3.1 Flash Image Preview)","author":"google","authorDisplay":"Google","description":"Gemini 3.1 Flash Image Preview, a.k.a. \"Nano Banana 2,\" is Google’s latest state of the art image generation and editing model, delivering Pro-level visual quality at Flash speed. It combines...","shortDescription":"Gemini 3.","categories":["image","text","multimodal","reasoning"],"inputModalities":["image","text"],"outputModalities":["image","text"],"contextLength":131072,"supportsReasoning":true,"ranking":147,"createdAt":"2026-02-26T15:25:58.000Z","group":"google/gemini-3.1-flash-image-preview-20260226","tier":"pro"},{"slug":"qwen/qwen3.5-35b-a3b","name":"Qwen: Qwen3.5-35B-A3B","shortName":"Qwen3.5-35B-A3B","author":"qwen","authorDisplay":"Qwen","description":"The Qwen3.5 Series 35B-A3B is a native vision-language model designed with a hybrid architecture that integrates linear attention mechanisms and a sparse mixture-of-experts model, achieving higher inference efficiency. Its overall...","shortDescription":"The Qwen3.","categories":["text","multimodal","reasoning"],"inputModalities":["text","image","video"],"outputModalities":["text"],"contextLength":262144,"supportsReasoning":true,"ranking":148,"createdAt":"2026-02-25T21:10:22.000Z","group":"qwen/qwen3.5-35b-a3b-20260224","tier":"basic"},{"slug":"qwen/qwen3.5-27b","name":"Qwen: Qwen3.5-27B","shortName":"Qwen3.5-27B","author":"qwen","authorDisplay":"Qwen","description":"The Qwen3.5 27B native vision-language Dense model incorporates a linear attention mechanism, delivering fast response times while balancing inference speed and performance. Its overall capabilities are comparable to those of...","shortDescription":"The Qwen3.","categories":["text","multimodal","reasoning"],"inputModalities":["text","image","video"],"outputModalities":["text"],"contextLength":262144,"supportsReasoning":true,"ranking":149,"createdAt":"2026-02-25T21:10:10.000Z","group":"qwen/qwen3.5-27b-20260224","tier":"basic"},{"slug":"qwen/qwen3.5-122b-a10b","name":"Qwen: Qwen3.5-122B-A10B","shortName":"Qwen3.5-122B-A10B","author":"qwen","authorDisplay":"Qwen","description":"The Qwen3.5 122B-A10B native vision-language model is built on a hybrid architecture that integrates a linear attention mechanism with a sparse mixture-of-experts model, achieving higher inference efficiency. In terms of...","shortDescription":"The Qwen3.","categories":["text","multimodal","reasoning"],"inputModalities":["text","image","video"],"outputModalities":["text"],"contextLength":262144,"supportsReasoning":true,"ranking":150,"createdAt":"2026-02-25T21:09:49.000Z","group":"qwen/qwen3.5-122b-a10b-20260224","tier":"basic"},{"slug":"qwen/qwen3.5-flash-02-23","name":"Qwen: Qwen3.5-Flash","shortName":"Qwen3.5-Flash","author":"qwen","authorDisplay":"Qwen","description":"The Qwen3.5 native vision-language Flash models are built on a hybrid architecture that integrates a linear attention mechanism with a sparse mixture-of-experts model, achieving higher inference efficiency. Compared to the...","shortDescription":"The Qwen3.","categories":["text","multimodal","reasoning"],"inputModalities":["text","image","video"],"outputModalities":["text"],"contextLength":1000000,"supportsReasoning":true,"ranking":151,"createdAt":"2026-02-25T21:09:36.000Z","group":"qwen/qwen3.5-flash-20260224","tier":"basic"},{"slug":"google/gemini-3.1-pro-preview-customtools","name":"Google: Gemini 3.1 Pro Preview Custom Tools","shortName":"Gemini 3.1 Pro Preview Custom Tools","author":"google","authorDisplay":"Google","description":"Gemini 3.1 Pro Preview Custom Tools is a variant of Gemini 3.1 Pro that improves tool selection behavior by preventing overuse of a general bash tool when more efficient third-party...","shortDescription":"Gemini 3.","categories":["text","multimodal","reasoning"],"inputModalities":["text","audio","image","video","file"],"outputModalities":["text"],"contextLength":1048576,"supportsReasoning":true,"ranking":152,"createdAt":"2026-02-25T18:58:43.000Z","group":"google/gemini-3.1-pro-preview-customtools-20260219","tier":"pro"},{"slug":"openai/gpt-5.3-codex","name":"OpenAI: GPT-5.3-Codex","shortName":"GPT-5.3-Codex","author":"openai","authorDisplay":"OpenAI","description":"GPT-5.3-Codex is OpenAI’s most advanced agentic coding model, combining the frontier software engineering performance of GPT-5.2-Codex with the broader reasoning and professional knowledge capabilities of GPT-5.2. It achieves state-of-the-art results...","shortDescription":"GPT-5.","categories":["text","multimodal","reasoning","coding"],"inputModalities":["text","image","file"],"outputModalities":["text"],"contextLength":400000,"supportsReasoning":true,"ranking":153,"createdAt":"2026-02-24T18:52:44.000Z","group":"openai/gpt-5.3-codex-20260224","tier":"pro"},{"slug":"aion-labs/aion-2.0","name":"AionLabs: Aion-2.0","shortName":"Aion-2.0","author":"aion-labs","authorDisplay":"Aion labs","description":"Aion-2.0 is a variant of DeepSeek V3.2 optimized for immersive roleplaying and storytelling. It is particularly strong at introducing tension, crises, and conflict into stories, making narratives feel more engaging....","shortDescription":"Aion-2.","categories":["text","reasoning"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":131072,"supportsReasoning":true,"ranking":154,"createdAt":"2026-02-23T21:15:06.000Z","group":"aion-labs/aion-2.0-20260223","tier":"pro"},{"slug":"google/gemini-3.1-pro-preview","name":"Google: Gemini 3.1 Pro Preview","shortName":"Gemini 3.1 Pro Preview","author":"google","authorDisplay":"Google","description":"Gemini 3.1 Pro Preview is Google’s frontier reasoning model, delivering enhanced software engineering performance, improved agentic reliability, and more efficient token usage across complex workflows. Building on the multimodal foundation...","shortDescription":"Gemini 3.","categories":["text","multimodal","reasoning"],"inputModalities":["audio","file","image","text","video"],"outputModalities":["text"],"contextLength":1048576,"supportsReasoning":true,"ranking":155,"createdAt":"2026-02-19T14:00:27.000Z","group":"google/gemini-3.1-pro-preview-20260219","tier":"pro"},{"slug":"anthropic/claude-sonnet-4.6","name":"Anthropic: Claude Sonnet 4.6","shortName":"Claude Sonnet 4.6","author":"anthropic","authorDisplay":"Anthropic","description":"Sonnet 4.6 is Anthropic's most capable Sonnet-class model yet, with frontier performance across coding, agents, and professional work. It excels at iterative development, complex codebase navigation, end-to-end project management with...","shortDescription":"Sonnet 4.","categories":["text","multimodal","reasoning"],"inputModalities":["text","image","file"],"outputModalities":["text"],"contextLength":1000000,"supportsReasoning":true,"ranking":156,"createdAt":"2026-02-17T15:43:10.000Z","group":"anthropic/claude-4.6-sonnet-20260217","tier":"pro"},{"slug":"qwen/qwen3.5-plus-02-15","name":"Qwen: Qwen3.5 Plus 2026-02-15","shortName":"Qwen3.5 Plus 2026-02-15","author":"qwen","authorDisplay":"Qwen","description":"The Qwen3.5 native vision-language series Plus models are built on a hybrid architecture that integrates linear attention mechanisms with sparse mixture-of-experts models, achieving higher inference efficiency. In a variety of...","shortDescription":"The Qwen3.","categories":["text","multimodal","reasoning"],"inputModalities":["text","image","video"],"outputModalities":["text"],"contextLength":1000000,"supportsReasoning":true,"ranking":157,"createdAt":"2026-02-16T08:10:16.000Z","group":"qwen/qwen3.5-plus-20260216","tier":"basic"},{"slug":"qwen/qwen3.5-397b-a17b","name":"Qwen: Qwen3.5 397B A17B","shortName":"Qwen3.5 397B A17B","author":"qwen","authorDisplay":"Qwen","description":"The Qwen3.5 series 397B-A17B native vision-language model is built on a hybrid architecture that integrates a linear attention mechanism with a sparse mixture-of-experts model, achieving higher inference efficiency. It delivers...","shortDescription":"The Qwen3.","categories":["text","multimodal","reasoning"],"inputModalities":["text","image","video"],"outputModalities":["text"],"contextLength":262144,"supportsReasoning":true,"ranking":158,"createdAt":"2026-02-16T06:23:38.000Z","group":"qwen/qwen3.5-397b-a17b-20260216","tier":"pro"},{"slug":"minimax/minimax-m2.5","name":"MiniMax: MiniMax M2.5","shortName":"MiniMax M2.5","author":"minimax","authorDisplay":"Minimax","description":"MiniMax-M2.5 is a SOTA large language model designed for real-world productivity. Trained in a diverse range of complex real-world digital working environments, M2.5 builds upon the coding expertise of M2.1...","shortDescription":"MiniMax-M2.","categories":["text","reasoning"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":204800,"supportsReasoning":true,"ranking":159,"createdAt":"2026-02-12T15:01:42.000Z","group":"minimax/minimax-m2.5-20260211","tier":"basic"},{"slug":"z-ai/glm-5","name":"Z.ai: GLM 5","shortName":"GLM 5","author":"z-ai","authorDisplay":"Z ai","description":"GLM-5 is Z.ai’s flagship open-source foundation model engineered for complex systems design and long-horizon agent workflows. Built for expert developers, it delivers production-grade performance on large-scale programming tasks, rivaling leading...","shortDescription":"GLM-5 is Z.","categories":["text","reasoning"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":204800,"supportsReasoning":true,"ranking":160,"createdAt":"2026-02-11T16:59:42.000Z","group":"z-ai/glm-5-20260211","tier":"pro"},{"slug":"qwen/qwen3-max-thinking","name":"Qwen: Qwen3 Max Thinking","shortName":"Qwen3 Max Thinking","author":"qwen","authorDisplay":"Qwen","description":"Qwen3-Max-Thinking is the flagship reasoning model in the Qwen3 series, designed for high-stakes cognitive tasks that require deep, multi-step reasoning. By significantly scaling model capacity and reinforcement learning compute, it...","shortDescription":"Qwen3-Max-Thinking is the flagship reasoning model in the Qwen3 series, designed for high-stakes cognitive tasks that require deep, multi-step reasoning.","categories":["text","reasoning"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":262144,"supportsReasoning":true,"ranking":161,"createdAt":"2026-02-09T21:18:21.000Z","group":"qwen/qwen3-max-thinking-20260123","tier":"pro"},{"slug":"anthropic/claude-opus-4.6","name":"Anthropic: Claude Opus 4.6","shortName":"Claude Opus 4.6","author":"anthropic","authorDisplay":"Anthropic","description":"Opus 4.6 is Anthropic’s strongest model for coding and long-running professional tasks. It is built for agents that operate across entire workflows rather than single prompts, making it especially effective...","shortDescription":"Opus 4.","categories":["text","multimodal","reasoning"],"inputModalities":["text","image","file"],"outputModalities":["text"],"contextLength":1000000,"supportsReasoning":true,"ranking":162,"createdAt":"2026-02-04T15:30:50.000Z","group":"anthropic/claude-4.6-opus-20260205","tier":"ultimate"},{"slug":"qwen/qwen3-coder-next","name":"Qwen: Qwen3 Coder Next","shortName":"Qwen3 Coder Next","author":"qwen","authorDisplay":"Qwen","description":"Qwen3-Coder-Next is an open-weight causal language model optimized for coding agents and local development workflows. It uses a sparse MoE design with 80B total parameters and only 3B activated per...","shortDescription":"Qwen3-Coder-Next is an open-weight causal language model optimized for coding agents and local development workflows.","categories":["text","coding"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":262144,"supportsReasoning":false,"ranking":163,"createdAt":"2026-02-04T00:15:01.000Z","group":"qwen/qwen3-coder-next-2025-02-03","tier":"basic"},{"slug":"sourceful/riverflow-v2-pro","name":"Sourceful: Riverflow V2 Pro","shortName":"Riverflow V2 Pro","author":"sourceful","authorDisplay":"Sourceful","description":"Riverflow V2 Pro is the most powerful variant of Sourceful's Riverflow 2.0 lineup, best for top-tier control and perfect text rendering. The Riverflow 2.0 series represents SOTA performance on image...","shortDescription":"Riverflow V2 Pro is the most powerful variant of Sourceful's Riverflow 2.","categories":["image","multimodal"],"inputModalities":["text","image"],"outputModalities":["image"],"contextLength":8192,"supportsReasoning":false,"ranking":164,"createdAt":"2026-02-02T16:57:07.000Z","group":"sourceful/riverflow-v2-pro-20260130","tier":"pro"},{"slug":"sourceful/riverflow-v2-fast","name":"Sourceful: Riverflow V2 Fast","shortName":"Riverflow V2 Fast","author":"sourceful","authorDisplay":"Sourceful","description":"Riverflow V2 Fast is the fastest variant of Sourceful's Riverflow 2.0 lineup, best for production deployments and latency-critical workflows. The Riverflow 2.0 series represents SOTA performance on image generation and...","shortDescription":"Riverflow V2 Fast is the fastest variant of Sourceful's Riverflow 2.","categories":["image","multimodal"],"inputModalities":["text","image"],"outputModalities":["image"],"contextLength":8192,"supportsReasoning":false,"ranking":165,"createdAt":"2026-02-02T16:57:03.000Z","group":"sourceful/riverflow-v2-fast-20260130","tier":"pro"},{"slug":"openrouter/free","name":"Free Models Router","shortName":"Free Models Router","author":"openrouter","authorDisplay":"Openrouter","description":"The simplest way to get free inference. openrouter/free is a router that selects free models at random from the models available on OpenRouter. The router smartly filters for models that...","shortDescription":"The simplest way to get free inference.","categories":["text","multimodal","reasoning"],"inputModalities":["text","image"],"outputModalities":["text"],"contextLength":200000,"supportsReasoning":true,"ranking":166,"createdAt":"2026-02-01T03:43:47.000Z","group":"openrouter/free","tier":"basic"},{"slug":"stepfun/step-3.5-flash","name":"StepFun: Step 3.5 Flash","shortName":"Step 3.5 Flash","author":"stepfun","authorDisplay":"Stepfun","description":"Step 3.5 Flash is StepFun's most capable open-source foundation model. Built on a sparse Mixture of Experts (MoE) architecture, it selectively activates only 11B of its 196B parameters per token....","shortDescription":"Step 3.","categories":["text","reasoning"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":262144,"supportsReasoning":true,"ranking":167,"createdAt":"2026-01-29T23:12:17.000Z","group":"stepfun/step-3.5-flash","tier":"basic"},{"slug":"moonshotai/kimi-k2.5","name":"MoonshotAI: Kimi K2.5","shortName":"Kimi K2.5","author":"moonshotai","authorDisplay":"Moonshotai","description":"Kimi K2.5 is Moonshot AI's native multimodal model, delivering state-of-the-art visual coding capability and a self-directed agent swarm paradigm. Built on Kimi K2 with continued pretraining over approximately 15T mixed...","shortDescription":"Kimi K2.","categories":["text","multimodal","reasoning"],"inputModalities":["text","image"],"outputModalities":["text"],"contextLength":262144,"supportsReasoning":true,"ranking":168,"createdAt":"2026-01-27T04:11:16.000Z","group":"moonshotai/kimi-k2.5-0127","tier":"pro"},{"slug":"upstage/solar-pro-3","name":"Upstage: Solar Pro 3","shortName":"Solar Pro 3","author":"upstage","authorDisplay":"Upstage","description":"Solar Pro 3 is Upstage's powerful Mixture-of-Experts (MoE) language model. With 102B total parameters and 12B active parameters per forward pass, it delivers exceptional performance while maintaining computational efficiency. Optimized...","shortDescription":"Solar Pro 3 is Upstage's powerful Mixture-of-Experts (MoE) language model.","categories":["text","reasoning"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":128000,"supportsReasoning":true,"ranking":169,"createdAt":"2026-01-27T02:33:20.000Z","group":"upstage/solar-pro-3","tier":"basic"},{"slug":"minimax/minimax-m2-her","name":"MiniMax: MiniMax M2-her","shortName":"MiniMax M2-her","author":"minimax","authorDisplay":"Minimax","description":"MiniMax M2-her is a dialogue-first large language model built for immersive roleplay, character-driven chat, and expressive multi-turn conversations. Designed to stay consistent in tone and personality, it supports rich message...","shortDescription":"MiniMax M2-her is a dialogue-first large language model built for immersive roleplay, character-driven chat, and expressive multi-turn conversations.","categories":["text"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":65536,"supportsReasoning":false,"ranking":170,"createdAt":"2026-01-23T14:07:19.000Z","group":"minimax/minimax-m2-her-20260123","tier":"basic"},{"slug":"writer/palmyra-x5","name":"Writer: Palmyra X5","shortName":"Palmyra X5","author":"writer","authorDisplay":"Writer","description":"Palmyra X5 is Writer's most advanced model, purpose-built for building and scaling AI agents across the enterprise. It delivers industry-leading speed and efficiency on context windows up to 1 million...","shortDescription":"Palmyra X5 is Writer's most advanced model, purpose-built for building and scaling AI agents across the enterprise.","categories":["text"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":1040000,"supportsReasoning":false,"ranking":171,"createdAt":"2026-01-21T13:57:03.000Z","group":"writer/palmyra-x5-20250428","tier":"pro"},{"slug":"openai/gpt-audio","name":"OpenAI: GPT Audio","shortName":"GPT Audio","author":"openai","authorDisplay":"OpenAI","description":"The gpt-audio model is OpenAI's first generally available audio model. The new snapshot features an upgraded decoder for more natural sounding voices and maintains better voice consistency. Audio is priced...","shortDescription":"The gpt-audio model is OpenAI's first generally available audio model.","categories":["text","multimodal"],"inputModalities":["text","audio"],"outputModalities":["text","audio"],"contextLength":128000,"supportsReasoning":false,"ranking":172,"createdAt":"2026-01-19T22:42:49.000Z","group":"openai/gpt-audio","tier":"pro"},{"slug":"openai/gpt-audio-mini","name":"OpenAI: GPT Audio Mini","shortName":"GPT Audio Mini","author":"openai","authorDisplay":"OpenAI","description":"A cost-efficient version of GPT Audio. The new snapshot features an upgraded decoder for more natural sounding voices and maintains better voice consistency. Input is priced at $0.60 per million...","shortDescription":"A cost-efficient version of GPT Audio.","categories":["text","multimodal"],"inputModalities":["text","audio"],"outputModalities":["text","audio"],"contextLength":128000,"supportsReasoning":false,"ranking":173,"createdAt":"2026-01-19T21:50:19.000Z","group":"openai/gpt-audio-mini","tier":"pro"},{"slug":"z-ai/glm-4.7-flash","name":"Z.ai: GLM 4.7 Flash","shortName":"GLM 4.7 Flash","author":"z-ai","authorDisplay":"Z ai","description":"As a 30B-class SOTA model, GLM-4.7-Flash offers a new option that balances performance and efficiency. It is further optimized for agentic coding use cases, strengthening coding capabilities, long-horizon task planning,...","shortDescription":"As a 30B-class SOTA model, GLM-4.","categories":["text","reasoning"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":202752,"supportsReasoning":true,"ranking":174,"createdAt":"2026-01-19T14:45:13.000Z","group":"z-ai/glm-4.7-flash-20260119","tier":"basic"},{"slug":"black-forest-labs/flux.2-klein-4b","name":"Black Forest Labs: FLUX.2 Klein 4B","shortName":"FLUX.2 Klein 4B","author":"black-forest-labs","authorDisplay":"Black forest labs","description":"FLUX.2 [klein] 4B is the fastest and most cost-effective model in the FLUX.2 family, optimized for high-throughput use cases while maintaining excellent image quality. Pricing is based on the output...","shortDescription":"FLUX.","categories":["image","multimodal"],"inputModalities":["text","image"],"outputModalities":["image"],"contextLength":40960,"supportsReasoning":false,"ranking":175,"createdAt":"2026-01-14T22:20:28.000Z","group":"black-forest-labs/flux.2-klein-4b","tier":"pro"},{"slug":"openai/gpt-5.2-codex","name":"OpenAI: GPT-5.2-Codex","shortName":"GPT-5.2-Codex","author":"openai","authorDisplay":"OpenAI","description":"GPT-5.2-Codex is an upgraded version of GPT-5.1-Codex optimized for software engineering and coding workflows. It is designed for both interactive development sessions and long, independent execution of complex engineering tasks....","shortDescription":"GPT-5.","categories":["text","multimodal","reasoning","coding"],"inputModalities":["text","image"],"outputModalities":["text"],"contextLength":400000,"supportsReasoning":true,"ranking":176,"createdAt":"2026-01-14T16:48:35.000Z","group":"openai/gpt-5.2-codex-20260114","tier":"pro"},{"slug":"bytedance-seed/seedream-4.5","name":"ByteDance Seed: Seedream 4.5","shortName":"Seedream 4.5","author":"bytedance-seed","authorDisplay":"ByteDance","description":"Seedream 4.5 is the latest in-house image generation model developed by ByteDance. Compared with Seedream 4.0, it delivers comprehensive improvements, especially in editing consistency, including better preservation of subject details,...","shortDescription":"Seedream 4.","categories":["image","multimodal"],"inputModalities":["image","text"],"outputModalities":["image"],"contextLength":4096,"supportsReasoning":false,"ranking":177,"createdAt":"2025-12-23T19:51:46.000Z","group":"bytedance-seed/seedream-4.5-20251203","tier":"pro"},{"slug":"bytedance-seed/seed-1.6-flash","name":"ByteDance Seed: Seed 1.6 Flash","shortName":"Seed 1.6 Flash","author":"bytedance-seed","authorDisplay":"ByteDance","description":"Seed 1.6 Flash is an ultra-fast multimodal deep thinking model by ByteDance Seed, supporting both text and visual understanding. It features a 256k context window and can generate outputs of...","shortDescription":"Seed 1.","categories":["text","multimodal","reasoning"],"inputModalities":["image","text","video"],"outputModalities":["text"],"contextLength":262144,"supportsReasoning":true,"ranking":178,"createdAt":"2025-12-23T15:50:11.000Z","group":"bytedance-seed/seed-1.6-flash-20250625","tier":"basic"},{"slug":"bytedance-seed/seed-1.6","name":"ByteDance Seed: Seed 1.6","shortName":"Seed 1.6","author":"bytedance-seed","authorDisplay":"ByteDance","description":"Seed 1.6 is a general-purpose model released by the ByteDance Seed team. It incorporates multimodal capabilities and adaptive deep thinking with a 256K context window.","shortDescription":"Seed 1.","categories":["text","multimodal","reasoning"],"inputModalities":["image","text","video"],"outputModalities":["text"],"contextLength":262144,"supportsReasoning":true,"ranking":179,"createdAt":"2025-12-23T15:49:57.000Z","group":"bytedance-seed/seed-1.6-20250625","tier":"basic"},{"slug":"minimax/minimax-m2.1","name":"MiniMax: MiniMax M2.1","shortName":"MiniMax M2.1","author":"minimax","authorDisplay":"Minimax","description":"MiniMax-M2.1 is a lightweight, state-of-the-art large language model optimized for coding, agentic workflows, and modern application development. With only 10 billion activated parameters, it delivers a major jump in real-world...","shortDescription":"MiniMax-M2.","categories":["text","reasoning"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":204800,"supportsReasoning":true,"ranking":180,"createdAt":"2025-12-23T01:56:37.000Z","group":"minimax/minimax-m2.1","tier":"basic"},{"slug":"z-ai/glm-4.7","name":"Z.ai: GLM 4.7","shortName":"GLM 4.7","author":"z-ai","authorDisplay":"Z ai","description":"GLM-4.7 is Z.ai’s latest flagship model, featuring upgrades in two key areas: enhanced programming capabilities and more stable multi-step reasoning/execution. It demonstrates significant improvements in executing complex agent tasks while...","shortDescription":"GLM-4.","categories":["text","reasoning"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":204800,"supportsReasoning":true,"ranking":181,"createdAt":"2025-12-22T04:33:34.000Z","group":"z-ai/glm-4.7-20251222","tier":"pro"},{"slug":"google/gemini-3-flash-preview","name":"Google: Gemini 3 Flash Preview","shortName":"Gemini 3 Flash Preview","author":"google","authorDisplay":"Google","description":"Gemini 3 Flash Preview is a high speed, high value thinking model designed for agentic workflows, multi turn chat, and coding assistance. It delivers near Pro level reasoning and tool...","shortDescription":"Gemini 3 Flash Preview is a high speed, high value thinking model designed for agentic workflows, multi turn chat, and coding assistance.","categories":["text","multimodal","reasoning"],"inputModalities":["text","image","file","audio","video"],"outputModalities":["text"],"contextLength":1048576,"supportsReasoning":true,"ranking":182,"createdAt":"2025-12-17T15:57:58.000Z","group":"google/gemini-3-flash-preview-20251217","tier":"pro"},{"slug":"black-forest-labs/flux.2-max","name":"Black Forest Labs: FLUX.2 Max","shortName":"FLUX.2 Max","author":"black-forest-labs","authorDisplay":"Black forest labs","description":"FLUX.2 [max] is the new top-tier image model from Black Forest Labs, pushing image quality, prompt understanding, and editing consistency to the highest level yet. Pricing is as follows, [per...","shortDescription":"FLUX.","categories":["image","multimodal"],"inputModalities":["text","image"],"outputModalities":["image"],"contextLength":46864,"supportsReasoning":false,"ranking":183,"createdAt":"2025-12-16T03:59:30.000Z","group":"black-forest-labs/flux.2-max","tier":"pro"},{"slug":"nvidia/nemotron-3-nano-30b-a3b","name":"NVIDIA: Nemotron 3 Nano 30B A3B","shortName":"Nemotron 3 Nano 30B A3B","author":"nvidia","authorDisplay":"NVIDIA","description":"NVIDIA Nemotron 3 Nano 30B A3B is a small language MoE model with highest compute efficiency and accuracy for developers to build specialized agentic AI systems. The model is fully...","shortDescription":"NVIDIA Nemotron 3 Nano 30B A3B is a small language MoE model with highest compute efficiency and accuracy for developers to build specialized agentic AI systems.","categories":["text","reasoning"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":262144,"supportsReasoning":true,"ranking":184,"createdAt":"2025-12-14T16:54:35.000Z","group":"nvidia/nemotron-3-nano-30b-a3b","tier":"basic"},{"slug":"nvidia/nemotron-3-nano-30b-a3b:free","name":"NVIDIA: Nemotron 3 Nano 30B A3B","shortName":"Nemotron 3 Nano 30B A3B","author":"nvidia","authorDisplay":"NVIDIA","description":"NVIDIA Nemotron 3 Nano 30B A3B is a small language MoE model with highest compute efficiency and accuracy for developers to build specialized agentic AI systems. The model is fully...","shortDescription":"NVIDIA Nemotron 3 Nano 30B A3B is a small language MoE model with highest compute efficiency and accuracy for developers to build specialized agentic AI systems.","categories":["text","reasoning"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":256000,"supportsReasoning":true,"ranking":185,"createdAt":"2025-12-14T16:54:35.000Z","group":"nvidia/nemotron-3-nano-30b-a3b","tier":"basic"},{"slug":"openai/gpt-5.2-chat","name":"OpenAI: GPT-5.2 Chat","shortName":"GPT-5.2 Chat","author":"openai","authorDisplay":"OpenAI","description":"GPT-5.2 Chat (AKA Instant) is the fast, lightweight member of the 5.2 family, optimized for low-latency chat while retaining strong general intelligence. It uses adaptive reasoning to selectively “think” on...","shortDescription":"GPT-5.","categories":["text","multimodal"],"inputModalities":["file","image","text"],"outputModalities":["text"],"contextLength":128000,"supportsReasoning":false,"ranking":186,"createdAt":"2025-12-10T18:03:03.000Z","group":"openai/gpt-5.2-chat-20251211","tier":"pro"},{"slug":"openai/gpt-5.2","name":"OpenAI: GPT-5.2","shortName":"GPT-5.2","author":"openai","authorDisplay":"OpenAI","description":"GPT-5.2 is the latest frontier-grade model in the GPT-5 series, offering stronger agentic and long context perfomance compared to GPT-5.1. It uses adaptive reasoning to allocate computation dynamically, responding quickly...","shortDescription":"GPT-5.","categories":["text","multimodal","reasoning"],"inputModalities":["file","image","text"],"outputModalities":["text"],"contextLength":400000,"supportsReasoning":true,"ranking":187,"createdAt":"2025-12-10T18:02:55.000Z","group":"openai/gpt-5.2-20251211","tier":"pro"},{"slug":"mistralai/devstral-2512","name":"Mistral: Devstral 2 2512","shortName":"Devstral 2 2512","author":"mistralai","authorDisplay":"Mistral AI","description":"Devstral 2 is a state-of-the-art open-source model by Mistral AI specializing in agentic coding. It is a 123B-parameter dense transformer model supporting a 256K context window. Devstral 2 supports exploring...","shortDescription":"Devstral 2 is a state-of-the-art open-source model by Mistral AI specializing in agentic coding.","categories":["text","multimodal"],"inputModalities":["text","file"],"outputModalities":["text"],"contextLength":262144,"supportsReasoning":false,"ranking":188,"createdAt":"2025-12-09T13:03:39.000Z","group":"mistralai/devstral-2512","tier":"pro"},{"slug":"relace/relace-search","name":"Relace: Relace Search","shortName":"Relace Search","author":"relace","authorDisplay":"Relace","description":"The relace-search model uses 4-12 `view_file` and `grep` tools in parallel to explore a codebase and return relevant files to the user request. In contrast to RAG, relace-search performs agentic...","shortDescription":"The relace-search model uses 4-12 `view_file` and `grep` tools in parallel to explore a codebase and return relevant files to the user request.","categories":["text"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":256000,"supportsReasoning":false,"ranking":189,"createdAt":"2025-12-08T17:06:00.000Z","group":"relace/relace-search-20251208","tier":"pro"},{"slug":"z-ai/glm-4.6v","name":"Z.ai: GLM 4.6V","shortName":"GLM 4.6V","author":"z-ai","authorDisplay":"Z ai","description":"GLM-4.6V is a large multimodal model designed for high-fidelity visual understanding and long-context reasoning across images, documents, and mixed media. It supports up to 128K tokens, processes complex page layouts...","shortDescription":"GLM-4.","categories":["text","multimodal","reasoning"],"inputModalities":["image","text","video"],"outputModalities":["text"],"contextLength":131072,"supportsReasoning":true,"ranking":190,"createdAt":"2025-12-08T15:24:22.000Z","group":"z-ai/glm-4.6-20251208","tier":"basic"},{"slug":"openrouter/bodybuilder","name":"Body Builder (beta)","shortName":"Body Builder (beta)","author":"openrouter","authorDisplay":"Openrouter","description":"Transform your natural language requests into structured OpenRouter API request objects. Describe what you want to accomplish with AI models, and Body Builder will construct the appropriate API calls. Example:...","shortDescription":"Transform your natural language requests into structured OpenRouter API request objects.","categories":["text"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":128000,"supportsReasoning":false,"ranking":191,"createdAt":"2025-12-05T03:00:53.000Z","group":"openrouter/bodybuilder","tier":"basic"},{"slug":"openai/gpt-5.1-codex-max","name":"OpenAI: GPT-5.1-Codex-Max","shortName":"GPT-5.1-Codex-Max","author":"openai","authorDisplay":"OpenAI","description":"GPT-5.1-Codex-Max is OpenAI’s latest agentic coding model, designed for long-running, high-context software development tasks. It is based on an updated version of the 5.1 reasoning stack and trained on agentic...","shortDescription":"GPT-5.","categories":["text","multimodal","reasoning","coding"],"inputModalities":["text","image"],"outputModalities":["text"],"contextLength":400000,"supportsReasoning":true,"ranking":192,"createdAt":"2025-12-04T20:08:54.000Z","group":"openai/gpt-5.1-codex-max-20251204","tier":"pro"},{"slug":"amazon/nova-2-lite-v1","name":"Amazon: Nova 2 Lite","shortName":"Nova 2 Lite","author":"amazon","authorDisplay":"Amazon","description":"Nova 2 Lite is a fast, cost-effective reasoning model for everyday workloads that can process text, images, and videos to generate text. Nova 2 Lite demonstrates standout capabilities in processing...","shortDescription":"Nova 2 Lite is a fast, cost-effective reasoning model for everyday workloads that can process text, images, and videos to generate text.","categories":["text","multimodal","reasoning"],"inputModalities":["text","image","video","file"],"outputModalities":["text"],"contextLength":1000000,"supportsReasoning":true,"ranking":193,"createdAt":"2025-12-02T17:31:12.000Z","group":"amazon/nova-2-lite-v1","tier":"basic"},{"slug":"mistralai/ministral-14b-2512","name":"Mistral: Ministral 3 14B 2512","shortName":"Ministral 3 14B 2512","author":"mistralai","authorDisplay":"Mistral AI","description":"The largest model in the Ministral 3 family, Ministral 3 14B offers frontier capabilities and performance comparable to its larger Mistral Small 3.2 24B counterpart. A powerful and efficient language...","shortDescription":"The largest model in the Ministral 3 family, Ministral 3 14B offers frontier capabilities and performance comparable to its larger Mistral Small 3.","categories":["text","multimodal"],"inputModalities":["text","image"],"outputModalities":["text"],"contextLength":262144,"supportsReasoning":false,"ranking":194,"createdAt":"2025-12-02T13:22:15.000Z","group":"mistralai/ministral-14b-2512","tier":"basic"},{"slug":"mistralai/ministral-8b-2512","name":"Mistral: Ministral 3 8B 2512","shortName":"Ministral 3 8B 2512","author":"mistralai","authorDisplay":"Mistral AI","description":"A balanced model in the Ministral 3 family, Ministral 3 8B is a powerful, efficient tiny language model with vision capabilities.","shortDescription":"A balanced model in the Ministral 3 family, Ministral 3 8B is a powerful, efficient tiny language model with vision capabilities.","categories":["text","multimodal"],"inputModalities":["text","image"],"outputModalities":["text"],"contextLength":262144,"supportsReasoning":false,"ranking":195,"createdAt":"2025-12-02T13:20:54.000Z","group":"mistralai/ministral-8b-2512","tier":"basic"},{"slug":"mistralai/ministral-3b-2512","name":"Mistral: Ministral 3 3B 2512","shortName":"Ministral 3 3B 2512","author":"mistralai","authorDisplay":"Mistral AI","description":"The smallest model in the Ministral 3 family, Ministral 3 3B is a powerful, efficient tiny language model with vision capabilities.","shortDescription":"The smallest model in the Ministral 3 family, Ministral 3 3B is a powerful, efficient tiny language model with vision capabilities.","categories":["text","multimodal"],"inputModalities":["text","image"],"outputModalities":["text"],"contextLength":131072,"supportsReasoning":false,"ranking":196,"createdAt":"2025-12-02T13:19:20.000Z","group":"mistralai/ministral-3b-2512","tier":"basic"},{"slug":"mistralai/mistral-large-2512","name":"Mistral: Mistral Large 3 2512","shortName":"Mistral Large 3 2512","author":"mistralai","authorDisplay":"Mistral AI","description":"Mistral Large 3 2512 is Mistral’s most capable model to date, featuring a sparse mixture-of-experts architecture with 41B active parameters (675B total), and released under the Apache 2.0 license.","shortDescription":"Mistral Large 3 2512 is Mistral’s most capable model to date, featuring a sparse mixture-of-experts architecture with 41B active parameters (675B total), and...","categories":["text","multimodal"],"inputModalities":["text","image","file"],"outputModalities":["text"],"contextLength":262144,"supportsReasoning":false,"ranking":197,"createdAt":"2025-12-01T21:27:52.000Z","group":"mistralai/mistral-large-2512","tier":"pro"},{"slug":"deepseek/deepseek-v3.2","name":"DeepSeek: DeepSeek V3.2","shortName":"DeepSeek V3.2","author":"deepseek","authorDisplay":"DeepSeek","description":"DeepSeek-V3.2 is a large language model designed to harmonize high computational efficiency with strong reasoning and agentic tool-use performance. It introduces DeepSeek Sparse Attention (DSA), a fine-grained sparse attention mechanism...","shortDescription":"DeepSeek-V3.","categories":["text","reasoning"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":163840,"supportsReasoning":true,"ranking":198,"createdAt":"2025-12-01T13:10:42.000Z","group":"deepseek/deepseek-v3.2-20251201","tier":"basic"},{"slug":"black-forest-labs/flux.2-flex","name":"Black Forest Labs: FLUX.2 Flex","shortName":"FLUX.2 Flex","author":"black-forest-labs","authorDisplay":"Black forest labs","description":"FLUX.2 [flex] excels at rendering complex text, typography, and fine details, and supports multi-reference editing in the same unified architecture. Pricing is as follows, [per the docs](https://bfl.ai/pricing?category=flux.2): We charge $0.06...","shortDescription":"FLUX.","categories":["image","multimodal"],"inputModalities":["text","image"],"outputModalities":["image"],"contextLength":67344,"supportsReasoning":false,"ranking":199,"createdAt":"2025-11-25T04:46:27.000Z","group":"black-forest-labs/flux.2-flex","tier":"pro"},{"slug":"black-forest-labs/flux.2-pro","name":"Black Forest Labs: FLUX.2 Pro","shortName":"FLUX.2 Pro","author":"black-forest-labs","authorDisplay":"Black forest labs","description":"A high-end image generation and editing model focused on frontier-level visual quality and reliability. It delivers strong prompt adherence, stable lighting, sharp textures, and consistent character/style reproduction across multi-reference inputs....","shortDescription":"A high-end image generation and editing model focused on frontier-level visual quality and reliability.","categories":["image","multimodal"],"inputModalities":["text","image"],"outputModalities":["image"],"contextLength":46864,"supportsReasoning":false,"ranking":200,"createdAt":"2025-11-25T00:24:34.000Z","group":"black-forest-labs/flux.2-pro","tier":"pro"},{"slug":"anthropic/claude-opus-4.5","name":"Anthropic: Claude Opus 4.5","shortName":"Claude Opus 4.5","author":"anthropic","authorDisplay":"Anthropic","description":"Claude Opus 4.5 is Anthropic’s frontier reasoning model optimized for complex software engineering, agentic workflows, and long-horizon computer use. It offers strong multimodal capabilities, competitive performance across real-world coding and...","shortDescription":"Claude Opus 4.","categories":["text","multimodal","reasoning"],"inputModalities":["file","image","text"],"outputModalities":["text"],"contextLength":200000,"supportsReasoning":true,"ranking":201,"createdAt":"2025-11-24T18:56:20.000Z","group":"anthropic/claude-4.5-opus-20251124","tier":"ultimate"},{"slug":"allenai/olmo-3-32b-think","name":"AllenAI: Olmo 3 32B Think","shortName":"Olmo 3 32B Think","author":"allenai","authorDisplay":"AllenAI","description":"Olmo 3 32B Think is a large-scale, 32-billion-parameter model purpose-built for deep reasoning, complex logic chains and advanced instruction-following scenarios. Its capacity enables strong performance on demanding evaluation tasks and...","shortDescription":"Olmo 3 32B Think is a large-scale, 32-billion-parameter model purpose-built for deep reasoning, complex logic chains and advanced instruction-following scena...","categories":["text","reasoning"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":65536,"supportsReasoning":true,"ranking":202,"createdAt":"2025-11-21T20:51:16.000Z","group":"allenai/olmo-3-32b-think-20251121","tier":"basic"},{"slug":"google/gemini-3-pro-image-preview","name":"Google: Nano Banana Pro (Gemini 3 Pro Image Preview)","shortName":"Nano Banana Pro (Gemini 3 Pro Image Preview)","author":"google","authorDisplay":"Google","description":"Nano Banana Pro is Google’s most advanced image-generation and editing model, built on Gemini 3 Pro. It extends the original Nano Banana with significantly improved multimodal reasoning, real-world grounding, and...","shortDescription":"Nano Banana Pro is Google’s most advanced image-generation and editing model, built on Gemini 3 Pro.","categories":["image","text","multimodal","reasoning"],"inputModalities":["image","text"],"outputModalities":["image","text"],"contextLength":65536,"supportsReasoning":true,"ranking":203,"createdAt":"2025-11-20T15:49:57.000Z","group":"google/gemini-3-pro-image-preview-20251120","tier":"pro"},{"slug":"deepcogito/cogito-v2.1-671b","name":"Deep Cogito: Cogito v2.1 671B","shortName":"Cogito v2.1 671B","author":"deepcogito","authorDisplay":"Deepcogito","description":"Cogito v2.1 671B MoE represents one of the strongest open models globally, matching performance of frontier closed and open models. This model is trained using self play with reinforcement learning...","shortDescription":"Cogito v2.","categories":["text","reasoning"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":128000,"supportsReasoning":true,"ranking":204,"createdAt":"2025-11-13T22:00:33.000Z","group":"deepcogito/cogito-v2.1-671b-20251118","tier":"pro"},{"slug":"openai/gpt-5.1","name":"OpenAI: GPT-5.1","shortName":"GPT-5.1","author":"openai","authorDisplay":"OpenAI","description":"GPT-5.1 is the latest frontier-grade model in the GPT-5 series, offering stronger general-purpose reasoning, improved instruction adherence, and a more natural conversational style compared to GPT-5. It uses adaptive reasoning...","shortDescription":"GPT-5.","categories":["text","multimodal","reasoning"],"inputModalities":["image","text","file"],"outputModalities":["text"],"contextLength":400000,"supportsReasoning":true,"ranking":205,"createdAt":"2025-11-13T18:58:25.000Z","group":"openai/gpt-5.1-20251113","tier":"pro"},{"slug":"openai/gpt-5.1-chat","name":"OpenAI: GPT-5.1 Chat","shortName":"GPT-5.1 Chat","author":"openai","authorDisplay":"OpenAI","description":"GPT-5.1 Chat (AKA Instant is the fast, lightweight member of the 5.1 family, optimized for low-latency chat while retaining strong general intelligence. It uses adaptive reasoning to selectively “think” on...","shortDescription":"GPT-5.","categories":["text","multimodal"],"inputModalities":["file","image","text"],"outputModalities":["text"],"contextLength":128000,"supportsReasoning":false,"ranking":206,"createdAt":"2025-11-13T18:58:22.000Z","group":"openai/gpt-5.1-chat-20251113","tier":"pro"},{"slug":"openai/gpt-5.1-codex","name":"OpenAI: GPT-5.1-Codex","shortName":"GPT-5.1-Codex","author":"openai","authorDisplay":"OpenAI","description":"GPT-5.1-Codex is a specialized version of GPT-5.1 optimized for software engineering and coding workflows. It is designed for both interactive development sessions and long, independent execution of complex engineering tasks....","shortDescription":"GPT-5.","categories":["text","multimodal","reasoning","coding"],"inputModalities":["text","image"],"outputModalities":["text"],"contextLength":400000,"supportsReasoning":true,"ranking":207,"createdAt":"2025-11-13T18:58:18.000Z","group":"openai/gpt-5.1-codex-20251113","tier":"pro"},{"slug":"openai/gpt-5.1-codex-mini","name":"OpenAI: GPT-5.1-Codex-Mini","shortName":"GPT-5.1-Codex-Mini","author":"openai","authorDisplay":"OpenAI","description":"GPT-5.1-Codex-Mini is a smaller and faster version of GPT-5.1-Codex","shortDescription":"GPT-5.","categories":["text","multimodal","reasoning","coding"],"inputModalities":["image","text"],"outputModalities":["text"],"contextLength":400000,"supportsReasoning":true,"ranking":208,"createdAt":"2025-11-13T18:17:00.000Z","group":"openai/gpt-5.1-codex-mini-20251113","tier":"basic"},{"slug":"moonshotai/kimi-k2-thinking","name":"MoonshotAI: Kimi K2 Thinking","shortName":"Kimi K2 Thinking","author":"moonshotai","authorDisplay":"Moonshotai","description":"Kimi K2 Thinking is Moonshot AI’s most advanced open reasoning model to date, extending the K2 series into agentic, long-horizon reasoning. Built on the trillion-parameter Mixture-of-Experts (MoE) architecture introduced in...","shortDescription":"Kimi K2 Thinking is Moonshot AI’s most advanced open reasoning model to date, extending the K2 series into agentic, long-horizon reasoning.","categories":["text","reasoning"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":262144,"supportsReasoning":true,"ranking":209,"createdAt":"2025-11-06T14:50:22.000Z","group":"moonshotai/kimi-k2-thinking-20251106","tier":"pro"},{"slug":"amazon/nova-premier-v1","name":"Amazon: Nova Premier 1.0","shortName":"Nova Premier 1.0","author":"amazon","authorDisplay":"Amazon","description":"Amazon Nova Premier is the most capable of Amazon’s multimodal models for complex reasoning tasks and for use as the best teacher for distilling custom models.","shortDescription":"Amazon Nova Premier is the most capable of Amazon’s multimodal models for complex reasoning tasks and for use as the best teacher for distilling custom models.","categories":["text","multimodal"],"inputModalities":["text","image"],"outputModalities":["text"],"contextLength":1000000,"supportsReasoning":false,"ranking":210,"createdAt":"2025-10-31T22:38:52.000Z","group":"amazon/nova-premier-v1","tier":"pro"},{"slug":"perplexity/sonar-pro-search","name":"Perplexity: Sonar Pro Search","shortName":"Sonar Pro Search","author":"perplexity","authorDisplay":"Perplexity","description":"Exclusively available on the OpenRouter API, Sonar Pro's new Pro Search mode is Perplexity's most advanced agentic search system. It is designed for deeper reasoning and analysis. Pricing is based...","shortDescription":"Exclusively available on the OpenRouter API, Sonar Pro's new Pro Search mode is Perplexity's most advanced agentic search system.","categories":["text","multimodal","reasoning"],"inputModalities":["text","image"],"outputModalities":["text"],"contextLength":200000,"supportsReasoning":true,"ranking":211,"createdAt":"2025-10-30T19:59:26.000Z","group":"perplexity/sonar-pro-search","tier":"pro"},{"slug":"mistralai/voxtral-small-24b-2507","name":"Mistral: Voxtral Small 24B 2507","shortName":"Voxtral Small 24B 2507","author":"mistralai","authorDisplay":"Mistral AI","description":"Voxtral Small is an enhancement of Mistral Small 3, incorporating state-of-the-art audio input capabilities while retaining best-in-class text performance. It excels at speech transcription, translation and audio understanding. Input audio...","shortDescription":"Voxtral Small is an enhancement of Mistral Small 3, incorporating state-of-the-art audio input capabilities while retaining best-in-class text performance.","categories":["text","multimodal"],"inputModalities":["text","audio","file"],"outputModalities":["text"],"contextLength":32000,"supportsReasoning":false,"ranking":212,"createdAt":"2025-10-30T14:39:04.000Z","group":"mistralai/voxtral-small-24b-2507","tier":"basic"},{"slug":"openai/gpt-oss-safeguard-20b","name":"OpenAI: gpt-oss-safeguard-20b","shortName":"gpt-oss-safeguard-20b","author":"openai","authorDisplay":"OpenAI","description":"gpt-oss-safeguard-20b is a safety reasoning model from OpenAI built upon gpt-oss-20b. This open-weight, 21B-parameter Mixture-of-Experts (MoE) model offers lower latency for safety tasks like content classification, LLM filtering, and trust...","shortDescription":"gpt-oss-safeguard-20b is a safety reasoning model from OpenAI built upon gpt-oss-20b.","categories":["text","reasoning"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":131072,"supportsReasoning":true,"ranking":213,"createdAt":"2025-10-29T15:47:16.000Z","group":"openai/gpt-oss-safeguard-20b","tier":"basic"},{"slug":"nvidia/nemotron-nano-12b-v2-vl:free","name":"NVIDIA: Nemotron Nano 12B 2 VL","shortName":"Nemotron Nano 12B 2 VL","author":"nvidia","authorDisplay":"NVIDIA","description":"NVIDIA Nemotron Nano 2 VL is a 12-billion-parameter open multimodal reasoning model designed for video understanding and document intelligence. It introduces a hybrid Transformer-Mamba architecture, combining transformer-level accuracy with Mamba’s...","shortDescription":"NVIDIA Nemotron Nano 2 VL is a 12-billion-parameter open multimodal reasoning model designed for video understanding and document intelligence.","categories":["text","multimodal","reasoning"],"inputModalities":["image","text","video"],"outputModalities":["text"],"contextLength":128000,"supportsReasoning":true,"ranking":214,"createdAt":"2025-10-28T18:19:25.000Z","group":"nvidia/nemotron-nano-12b-v2-vl","tier":"basic"},{"slug":"minimax/minimax-m2","name":"MiniMax: MiniMax M2","shortName":"MiniMax M2","author":"minimax","authorDisplay":"Minimax","description":"MiniMax-M2 is a compact, high-efficiency large language model optimized for end-to-end coding and agentic workflows. With 10 billion activated parameters (230 billion total), it delivers near-frontier intelligence across general reasoning,...","shortDescription":"MiniMax-M2 is a compact, high-efficiency large language model optimized for end-to-end coding and agentic workflows.","categories":["text","reasoning"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":204800,"supportsReasoning":true,"ranking":215,"createdAt":"2025-10-23T20:41:33.000Z","group":"minimax/minimax-m2","tier":"basic"},{"slug":"qwen/qwen3-vl-32b-instruct","name":"Qwen: Qwen3 VL 32B Instruct","shortName":"Qwen3 VL 32B Instruct","author":"qwen","authorDisplay":"Qwen","description":"Qwen3-VL-32B-Instruct is a large-scale multimodal vision-language model designed for high-precision understanding and reasoning across text, images, and video. With 32 billion parameters, it combines deep visual perception with advanced text...","shortDescription":"Qwen3-VL-32B-Instruct is a large-scale multimodal vision-language model designed for high-precision understanding and reasoning across text, images, and video.","categories":["text","multimodal"],"inputModalities":["text","image"],"outputModalities":["text"],"contextLength":131072,"supportsReasoning":false,"ranking":216,"createdAt":"2025-10-23T14:55:32.000Z","group":"qwen/qwen3-vl-32b-instruct","tier":"basic"},{"slug":"ibm-granite/granite-4.0-h-micro","name":"IBM: Granite 4.0 Micro","shortName":"Granite 4.0 Micro","author":"ibm-granite","authorDisplay":"Ibm granite","description":"Granite-4.0-H-Micro is a 3B parameter from the Granite 4 family of models. These models are the latest in a series of models released by IBM. They are fine-tuned for long...","shortDescription":"Granite-4.","categories":["text"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":131000,"supportsReasoning":false,"ranking":217,"createdAt":"2025-10-20T02:34:55.000Z","group":"ibm-granite/granite-4.0-h-micro","tier":"basic"},{"slug":"openai/gpt-5-image-mini","name":"OpenAI: GPT-5 Image Mini","shortName":"GPT-5 Image Mini","author":"openai","authorDisplay":"OpenAI","description":"GPT-5 Image Mini combines OpenAI's advanced language capabilities, powered by [GPT-5 Mini](https://openrouter.ai/openai/gpt-5-mini), with GPT Image 1 Mini for efficient image generation. This natively multimodal model features superior instruction following, text...","shortDescription":"GPT-5 Image Mini combines OpenAI's advanced language capabilities, powered by [GPT-5 Mini](https://openrouter.","categories":["image","text","multimodal","reasoning"],"inputModalities":["file","image","text"],"outputModalities":["image","text"],"contextLength":400000,"supportsReasoning":true,"ranking":218,"createdAt":"2025-10-16T14:23:03.000Z","group":"openai/gpt-5-image-mini","tier":"pro"},{"slug":"anthropic/claude-haiku-4.5","name":"Anthropic: Claude Haiku 4.5","shortName":"Claude Haiku 4.5","author":"anthropic","authorDisplay":"Anthropic","description":"Claude Haiku 4.5 is Anthropic’s fastest and most efficient model, delivering near-frontier intelligence at a fraction of the cost and latency of larger Claude models. Matching Claude Sonnet 4’s performance...","shortDescription":"Claude Haiku 4.","categories":["text","multimodal","reasoning"],"inputModalities":["text","image","file"],"outputModalities":["text"],"contextLength":200000,"supportsReasoning":true,"ranking":219,"createdAt":"2025-10-15T17:00:38.000Z","group":"anthropic/claude-4.5-haiku-20251001","tier":"pro"},{"slug":"qwen/qwen3-vl-8b-thinking","name":"Qwen: Qwen3 VL 8B Thinking","shortName":"Qwen3 VL 8B Thinking","author":"qwen","authorDisplay":"Qwen","description":"Qwen3-VL-8B-Thinking is the reasoning-optimized variant of the Qwen3-VL-8B multimodal model, designed for advanced visual and textual reasoning across complex scenes, documents, and temporal sequences. It integrates enhanced multimodal alignment and...","shortDescription":"Qwen3-VL-8B-Thinking is the reasoning-optimized variant of the Qwen3-VL-8B multimodal model, designed for advanced visual and textual reasoning across comple...","categories":["text","multimodal","reasoning"],"inputModalities":["image","text"],"outputModalities":["text"],"contextLength":131072,"supportsReasoning":true,"ranking":220,"createdAt":"2025-10-14T17:42:26.000Z","group":"qwen/qwen3-vl-8b-thinking","tier":"basic"},{"slug":"qwen/qwen3-vl-8b-instruct","name":"Qwen: Qwen3 VL 8B Instruct","shortName":"Qwen3 VL 8B Instruct","author":"qwen","authorDisplay":"Qwen","description":"Qwen3-VL-8B-Instruct is a multimodal vision-language model from the Qwen3-VL series, built for high-fidelity understanding and reasoning across text, images, and video. It features improved multimodal fusion with Interleaved-MRoPE for long-horizon...","shortDescription":"Qwen3-VL-8B-Instruct is a multimodal vision-language model from the Qwen3-VL series, built for high-fidelity understanding and reasoning across text, images,...","categories":["text","multimodal"],"inputModalities":["image","text"],"outputModalities":["text"],"contextLength":262144,"supportsReasoning":false,"ranking":221,"createdAt":"2025-10-14T17:35:08.000Z","group":"qwen/qwen3-vl-8b-instruct","tier":"basic"},{"slug":"openai/o4-mini-deep-research","name":"OpenAI: o4 Mini Deep Research","shortName":"o4 Mini Deep Research","author":"openai","authorDisplay":"OpenAI","description":"o4-mini-deep-research is OpenAI's faster, more affordable deep research model—ideal for tackling complex, multi-step research tasks.\n\nNote: This model always uses the 'web_search' tool which adds additional cost.","shortDescription":"o4-mini-deep-research is OpenAI's faster, more affordable deep research model—ideal for tackling complex, multi-step research tasks.","categories":["text","multimodal","reasoning"],"inputModalities":["file","image","text"],"outputModalities":["text"],"contextLength":200000,"supportsReasoning":true,"ranking":222,"createdAt":"2025-10-10T20:54:02.000Z","group":"openai/o4-mini-deep-research-2025-06-26","tier":"pro"},{"slug":"google/gemini-2.5-flash-image","name":"Google: Nano Banana (Gemini 2.5 Flash Image)","shortName":"Nano Banana (Gemini 2.5 Flash Image)","author":"google","authorDisplay":"Google","description":"Gemini 2.5 Flash Image, a.k.a. \"Nano Banana,\" is now generally available. It is a state of the art image generation model with contextual understanding. It is capable of image generation,...","shortDescription":"Gemini 2.","categories":["image","text","multimodal"],"inputModalities":["image","text"],"outputModalities":["image","text"],"contextLength":32768,"supportsReasoning":false,"ranking":223,"createdAt":"2025-10-07T20:53:51.000Z","group":"google/gemini-2.5-flash-image","tier":"basic"},{"slug":"qwen/qwen3-vl-30b-a3b-thinking","name":"Qwen: Qwen3 VL 30B A3B Thinking","shortName":"Qwen3 VL 30B A3B Thinking","author":"qwen","authorDisplay":"Qwen","description":"Qwen3-VL-30B-A3B-Thinking is a multimodal model that unifies strong text generation with visual understanding for images and videos. Its Thinking variant enhances reasoning in STEM, math, and complex tasks. It excels...","shortDescription":"Qwen3-VL-30B-A3B-Thinking is a multimodal model that unifies strong text generation with visual understanding for images and videos.","categories":["text","multimodal","reasoning"],"inputModalities":["text","image"],"outputModalities":["text"],"contextLength":262144,"supportsReasoning":true,"ranking":224,"createdAt":"2025-10-06T23:47:59.000Z","group":"qwen/qwen3-vl-30b-a3b-thinking","tier":"basic"},{"slug":"qwen/qwen3-vl-30b-a3b-instruct","name":"Qwen: Qwen3 VL 30B A3B Instruct","shortName":"Qwen3 VL 30B A3B Instruct","author":"qwen","authorDisplay":"Qwen","description":"Qwen3-VL-30B-A3B-Instruct is a multimodal model that unifies strong text generation with visual understanding for images and videos. Its Instruct variant optimizes instruction-following for general multimodal tasks. It excels in perception...","shortDescription":"Qwen3-VL-30B-A3B-Instruct is a multimodal model that unifies strong text generation with visual understanding for images and videos.","categories":["text","multimodal"],"inputModalities":["text","image"],"outputModalities":["text"],"contextLength":262144,"supportsReasoning":false,"ranking":225,"createdAt":"2025-10-06T23:47:56.000Z","group":"qwen/qwen3-vl-30b-a3b-instruct","tier":"basic"},{"slug":"z-ai/glm-4.6","name":"Z.ai: GLM 4.6","shortName":"GLM 4.6","author":"z-ai","authorDisplay":"Z ai","description":"Compared with GLM-4.5, this generation brings several key improvements: Longer context window: The context window has been expanded from 128K to 200K tokens, enabling the model to handle more complex...","shortDescription":"Compared with GLM-4.","categories":["text","reasoning"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":204800,"supportsReasoning":true,"ranking":226,"createdAt":"2025-09-30T12:32:56.000Z","group":"z-ai/glm-4.6","tier":"pro"},{"slug":"anthropic/claude-sonnet-4.5","name":"Anthropic: Claude Sonnet 4.5","shortName":"Claude Sonnet 4.5","author":"anthropic","authorDisplay":"Anthropic","description":"Claude Sonnet 4.5 is Anthropic’s most advanced Sonnet model to date, optimized for real-world agents and coding workflows. It delivers state-of-the-art performance on coding benchmarks such as SWE-bench Verified, with...","shortDescription":"Claude Sonnet 4.","categories":["text","multimodal","reasoning"],"inputModalities":["text","image","file"],"outputModalities":["text"],"contextLength":1000000,"supportsReasoning":true,"ranking":227,"createdAt":"2025-09-29T16:01:16.000Z","group":"anthropic/claude-4.5-sonnet-20250929","tier":"pro"},{"slug":"deepseek/deepseek-v3.2-exp","name":"DeepSeek: DeepSeek V3.2 Exp","shortName":"DeepSeek V3.2 Exp","author":"deepseek","authorDisplay":"DeepSeek","description":"DeepSeek-V3.2-Exp is an experimental large language model released by DeepSeek as an intermediate step between V3.1 and future architectures. It introduces DeepSeek Sparse Attention (DSA), a fine-grained sparse attention mechanism...","shortDescription":"DeepSeek-V3.","categories":["text","reasoning"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":163840,"supportsReasoning":true,"ranking":228,"createdAt":"2025-09-29T12:54:41.000Z","group":"deepseek/deepseek-v3.2-exp","tier":"basic"},{"slug":"thedrummer/cydonia-24b-v4.1","name":"TheDrummer: Cydonia 24B V4.1","shortName":"Cydonia 24B V4.1","author":"thedrummer","authorDisplay":"Thedrummer","description":"Uncensored and creative writing model based on Mistral Small 3.2 24B with good recall, prompt adherence, and intelligence.","shortDescription":"Uncensored and creative writing model based on Mistral Small 3.","categories":["text"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":131072,"supportsReasoning":false,"ranking":229,"createdAt":"2025-09-27T00:11:18.000Z","group":"thedrummer/cydonia-24b-v4.1","tier":"basic"},{"slug":"relace/relace-apply-3","name":"Relace: Relace Apply 3","shortName":"Relace Apply 3","author":"relace","authorDisplay":"Relace","description":"Relace Apply 3 is a specialized code-patching LLM that merges AI-suggested edits straight into your source files. It can apply updates from GPT-4o, Claude, and others into your files at...","shortDescription":"Relace Apply 3 is a specialized code-patching LLM that merges AI-suggested edits straight into your source files.","categories":["text"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":256000,"supportsReasoning":false,"ranking":230,"createdAt":"2025-09-26T12:59:32.000Z","group":"relace/relace-apply-3","tier":"pro"},{"slug":"qwen/qwen3-vl-235b-a22b-thinking","name":"Qwen: Qwen3 VL 235B A22B Thinking","shortName":"Qwen3 VL 235B A22B Thinking","author":"qwen","authorDisplay":"Qwen","description":"Qwen3-VL-235B-A22B Thinking is a multimodal model that unifies strong text generation with visual understanding across images and video. The Thinking model is optimized for multimodal reasoning in STEM and math....","shortDescription":"Qwen3-VL-235B-A22B Thinking is a multimodal model that unifies strong text generation with visual understanding across images and video.","categories":["text","multimodal","reasoning"],"inputModalities":["text","image"],"outputModalities":["text"],"contextLength":131072,"supportsReasoning":true,"ranking":231,"createdAt":"2025-09-23T23:04:50.000Z","group":"qwen/qwen3-vl-235b-a22b-thinking","tier":"basic"},{"slug":"qwen/qwen3-vl-235b-a22b-instruct","name":"Qwen: Qwen3 VL 235B A22B Instruct","shortName":"Qwen3 VL 235B A22B Instruct","author":"qwen","authorDisplay":"Qwen","description":"Qwen3-VL-235B-A22B Instruct is an open-weight multimodal model that unifies strong text generation with visual understanding across images and video. The Instruct model targets general vision-language use (VQA, document parsing, chart/table...","shortDescription":"Qwen3-VL-235B-A22B Instruct is an open-weight multimodal model that unifies strong text generation with visual understanding across images and video.","categories":["text","multimodal"],"inputModalities":["text","image"],"outputModalities":["text"],"contextLength":262144,"supportsReasoning":false,"ranking":232,"createdAt":"2025-09-23T23:04:47.000Z","group":"qwen/qwen3-vl-235b-a22b-instruct","tier":"basic"},{"slug":"qwen/qwen3-max","name":"Qwen: Qwen3 Max","shortName":"Qwen3 Max","author":"qwen","authorDisplay":"Qwen","description":"Qwen3-Max is an updated release built on the Qwen3 series, offering major improvements in reasoning, instruction following, multilingual support, and long-tail knowledge coverage compared to the January 2025 version. It...","shortDescription":"Qwen3-Max is an updated release built on the Qwen3 series, offering major improvements in reasoning, instruction following, multilingual support, and long-ta...","categories":["text","reasoning"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":262144,"supportsReasoning":true,"ranking":233,"createdAt":"2025-09-23T21:26:48.000Z","group":"qwen/qwen3-max","tier":"pro"},{"slug":"qwen/qwen3-coder-plus","name":"Qwen: Qwen3 Coder Plus","shortName":"Qwen3 Coder Plus","author":"qwen","authorDisplay":"Qwen","description":"Qwen3 Coder Plus is Alibaba's proprietary version of the Open Source Qwen3 Coder 480B A35B. It is a powerful coding agent model specializing in autonomous programming via tool calling and...","shortDescription":"Qwen3 Coder Plus is Alibaba's proprietary version of the Open Source Qwen3 Coder 480B A35B.","categories":["text","reasoning","coding"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":1000000,"supportsReasoning":true,"ranking":234,"createdAt":"2025-09-23T21:25:07.000Z","group":"qwen/qwen3-coder-plus","tier":"pro"},{"slug":"openai/gpt-5-codex","name":"OpenAI: GPT-5 Codex","shortName":"GPT-5 Codex","author":"openai","authorDisplay":"OpenAI","description":"GPT-5-Codex is a specialized version of GPT-5 optimized for software engineering and coding workflows. It is designed for both interactive development sessions and long, independent execution of complex engineering tasks....","shortDescription":"GPT-5-Codex is a specialized version of GPT-5 optimized for software engineering and coding workflows.","categories":["text","multimodal","reasoning","coding"],"inputModalities":["text","image"],"outputModalities":["text"],"contextLength":400000,"supportsReasoning":true,"ranking":235,"createdAt":"2025-09-23T16:03:23.000Z","group":"openai/gpt-5-codex","tier":"pro"},{"slug":"deepseek/deepseek-v3.1-terminus","name":"DeepSeek: DeepSeek V3.1 Terminus","shortName":"DeepSeek V3.1 Terminus","author":"deepseek","authorDisplay":"DeepSeek","description":"DeepSeek-V3.1 Terminus is an update to [DeepSeek V3.1](/deepseek/deepseek-chat-v3.1) that maintains the model's original capabilities while addressing issues reported by users, including language consistency and agent capabilities, further optimizing the model's...","shortDescription":"DeepSeek-V3.","categories":["text","reasoning"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":163840,"supportsReasoning":true,"ranking":236,"createdAt":"2025-09-22T13:37:55.000Z","group":"deepseek/deepseek-v3.1-terminus","tier":"basic"},{"slug":"qwen/qwen3-coder-flash","name":"Qwen: Qwen3 Coder Flash","shortName":"Qwen3 Coder Flash","author":"qwen","authorDisplay":"Qwen","description":"Qwen3 Coder Flash is Alibaba's fast and cost efficient version of their proprietary Qwen3 Coder Plus. It is a powerful coding agent model specializing in autonomous programming via tool calling...","shortDescription":"Qwen3 Coder Flash is Alibaba's fast and cost efficient version of their proprietary Qwen3 Coder Plus.","categories":["text","coding"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":1000000,"supportsReasoning":false,"ranking":237,"createdAt":"2025-09-17T13:25:36.000Z","group":"qwen/qwen3-coder-flash","tier":"basic"},{"slug":"qwen/qwen3-next-80b-a3b-thinking","name":"Qwen: Qwen3 Next 80B A3B Thinking","shortName":"Qwen3 Next 80B A3B Thinking","author":"qwen","authorDisplay":"Qwen","description":"Qwen3-Next-80B-A3B-Thinking is a reasoning-first chat model in the Qwen3-Next line that outputs structured “thinking” traces by default. It’s designed for hard multi-step problems; math proofs, code synthesis/debugging, logic, and agentic...","shortDescription":"Qwen3-Next-80B-A3B-Thinking is a reasoning-first chat model in the Qwen3-Next line that outputs structured “thinking” traces by default.","categories":["text","reasoning"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":262144,"supportsReasoning":true,"ranking":238,"createdAt":"2025-09-11T17:38:04.000Z","group":"qwen/qwen3-next-80b-a3b-thinking-2509","tier":"basic"},{"slug":"qwen/qwen3-next-80b-a3b-instruct","name":"Qwen: Qwen3 Next 80B A3B Instruct","shortName":"Qwen3 Next 80B A3B Instruct","author":"qwen","authorDisplay":"Qwen","description":"Qwen3-Next-80B-A3B-Instruct is an instruction-tuned chat model in the Qwen3-Next series optimized for fast, stable responses without “thinking” traces. It targets complex tasks across reasoning, code generation, knowledge QA, and multilingual...","shortDescription":"Qwen3-Next-80B-A3B-Instruct is an instruction-tuned chat model in the Qwen3-Next series optimized for fast, stable responses without “thinking” traces.","categories":["text"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":262144,"supportsReasoning":false,"ranking":239,"createdAt":"2025-09-11T17:36:53.000Z","group":"qwen/qwen3-next-80b-a3b-instruct-2509","tier":"basic"},{"slug":"qwen/qwen-plus-2025-07-28","name":"Qwen: Qwen Plus 0728","shortName":"Qwen Plus 0728","author":"qwen","authorDisplay":"Qwen","description":"Qwen Plus 0728, based on the Qwen3 foundation model, is a 1 million context hybrid reasoning model with a balanced performance, speed, and cost combination.","shortDescription":"Qwen Plus 0728, based on the Qwen3 foundation model, is a 1 million context hybrid reasoning model with a balanced performance, speed, and cost combination.","categories":["text","reasoning"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":1000000,"supportsReasoning":true,"ranking":240,"createdAt":"2025-09-08T16:06:39.000Z","group":"qwen/qwen-plus-2025-07-28","tier":"basic"},{"slug":"qwen/qwen-plus-2025-07-28:thinking","name":"Qwen: Qwen Plus 0728 (thinking)","shortName":"Qwen Plus 0728 (thinking)","author":"qwen","authorDisplay":"Qwen","description":"Qwen Plus 0728, based on the Qwen3 foundation model, is a 1 million context hybrid reasoning model with a balanced performance, speed, and cost combination.","shortDescription":"Qwen Plus 0728, based on the Qwen3 foundation model, is a 1 million context hybrid reasoning model with a balanced performance, speed, and cost combination.","categories":["text","reasoning"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":1000000,"supportsReasoning":true,"ranking":241,"createdAt":"2025-09-08T16:06:39.000Z","group":"qwen/qwen-plus-2025-07-28","tier":"basic"},{"slug":"nvidia/nemotron-nano-9b-v2:free","name":"NVIDIA: Nemotron Nano 9B V2","shortName":"Nemotron Nano 9B V2","author":"nvidia","authorDisplay":"NVIDIA","description":"NVIDIA-Nemotron-Nano-9B-v2 is a large language model (LLM) trained from scratch by NVIDIA, and designed as a unified model for both reasoning and non-reasoning tasks. It responds to user queries and...","shortDescription":"NVIDIA-Nemotron-Nano-9B-v2 is a large language model (LLM) trained from scratch by NVIDIA, and designed as a unified model for both reasoning and non-reasoni...","categories":["text","reasoning"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":128000,"supportsReasoning":true,"ranking":242,"createdAt":"2025-09-05T21:13:27.000Z","group":"nvidia/nemotron-nano-9b-v2","tier":"basic"},{"slug":"moonshotai/kimi-k2-0905","name":"MoonshotAI: Kimi K2 0905","shortName":"Kimi K2 0905","author":"moonshotai","authorDisplay":"Moonshotai","description":"Kimi K2 0905 is the September update of [Kimi K2 0711](moonshotai/kimi-k2). It is a large-scale Mixture-of-Experts (MoE) language model developed by Moonshot AI, featuring 1 trillion total parameters with 32...","shortDescription":"Kimi K2 0905 is the September update of [Kimi K2 0711](moonshotai/kimi-k2).","categories":["text"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":262144,"supportsReasoning":false,"ranking":243,"createdAt":"2025-09-04T21:25:47.000Z","group":"moonshotai/kimi-k2-0905","tier":"pro"},{"slug":"qwen/qwen3-30b-a3b-thinking-2507","name":"Qwen: Qwen3 30B A3B Thinking 2507","shortName":"Qwen3 30B A3B Thinking 2507","author":"qwen","authorDisplay":"Qwen","description":"Qwen3-30B-A3B-Thinking-2507 is a 30B parameter Mixture-of-Experts reasoning model optimized for complex tasks requiring extended multi-step thinking. The model is designed specifically for “thinking mode,” where internal reasoning traces are separated...","shortDescription":"Qwen3-30B-A3B-Thinking-2507 is a 30B parameter Mixture-of-Experts reasoning model optimized for complex tasks requiring extended multi-step thinking.","categories":["text","reasoning"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":81920,"supportsReasoning":true,"ranking":244,"createdAt":"2025-08-28T16:39:52.000Z","group":"qwen/qwen3-30b-a3b-thinking-2507","tier":"basic"},{"slug":"nousresearch/hermes-4-70b","name":"Nous: Hermes 4 70B","shortName":"Hermes 4 70B","author":"nousresearch","authorDisplay":"Nousresearch","description":"Hermes 4 70B is a hybrid reasoning model from Nous Research, built on Meta-Llama-3.1-70B. It introduces the same hybrid mode as the larger 405B release, allowing the model to either...","shortDescription":"Hermes 4 70B is a hybrid reasoning model from Nous Research, built on Meta-Llama-3.","categories":["text","reasoning"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":131072,"supportsReasoning":true,"ranking":245,"createdAt":"2025-08-26T19:23:02.000Z","group":"nousresearch/hermes-4-70b","tier":"basic"},{"slug":"nousresearch/hermes-4-405b","name":"Nous: Hermes 4 405B","shortName":"Hermes 4 405B","author":"nousresearch","authorDisplay":"Nousresearch","description":"Hermes 4 is a large-scale reasoning model built on Meta-Llama-3.1-405B and released by Nous Research. It introduces a hybrid reasoning mode, where the model can choose to deliberate internally with...","shortDescription":"Hermes 4 is a large-scale reasoning model built on Meta-Llama-3.","categories":["text","reasoning"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":131072,"supportsReasoning":true,"ranking":246,"createdAt":"2025-08-26T19:11:03.000Z","group":"nousresearch/hermes-4-405b","tier":"pro"},{"slug":"deepseek/deepseek-chat-v3.1","name":"DeepSeek: DeepSeek V3.1","shortName":"DeepSeek V3.1","author":"deepseek","authorDisplay":"DeepSeek","description":"DeepSeek-V3.1 is a large hybrid reasoning model (671B parameters, 37B active) that supports both thinking and non-thinking modes via prompt templates. It extends the DeepSeek-V3 base with a two-phase long-context...","shortDescription":"DeepSeek-V3.","categories":["text","reasoning"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":163840,"supportsReasoning":true,"ranking":247,"createdAt":"2025-08-21T12:33:48.000Z","group":"deepseek/deepseek-chat-v3.1","tier":"basic"},{"slug":"mistralai/mistral-medium-3.1","name":"Mistral: Mistral Medium 3.1","shortName":"Mistral Medium 3.1","author":"mistralai","authorDisplay":"Mistral AI","description":"Mistral Medium 3.1 is an updated version of Mistral Medium 3, which is a high-performance enterprise-grade language model designed to deliver frontier-level capabilities at significantly reduced operational cost. It balances...","shortDescription":"Mistral Medium 3.","categories":["text","multimodal"],"inputModalities":["text","image","file"],"outputModalities":["text"],"contextLength":131072,"supportsReasoning":false,"ranking":248,"createdAt":"2025-08-13T14:33:59.000Z","group":"mistralai/mistral-medium-3.1","tier":"pro"},{"slug":"z-ai/glm-4.5v","name":"Z.ai: GLM 4.5V","shortName":"GLM 4.5V","author":"z-ai","authorDisplay":"Z ai","description":"GLM-4.5V is a vision-language foundation model for multimodal agent applications. Built on a Mixture-of-Experts (MoE) architecture with 106B parameters and 12B activated parameters, it achieves state-of-the-art results in video understanding,...","shortDescription":"GLM-4.","categories":["text","multimodal","reasoning"],"inputModalities":["text","image"],"outputModalities":["text"],"contextLength":65536,"supportsReasoning":true,"ranking":249,"createdAt":"2025-08-11T14:24:48.000Z","group":"z-ai/glm-4.5v","tier":"pro"},{"slug":"ai21/jamba-large-1.7","name":"AI21: Jamba Large 1.7","shortName":"Jamba Large 1.7","author":"ai21","authorDisplay":"Ai21","description":"Jamba Large 1.7 is the latest model in the Jamba open family, offering improvements in grounding, instruction-following, and overall efficiency. Built on a hybrid SSM-Transformer architecture with a 256K context...","shortDescription":"Jamba Large 1.","categories":["text"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":256000,"supportsReasoning":false,"ranking":250,"createdAt":"2025-08-08T16:03:40.000Z","group":"ai21/jamba-large-1.7","tier":"pro"},{"slug":"openai/gpt-5-chat","name":"OpenAI: GPT-5 Chat","shortName":"GPT-5 Chat","author":"openai","authorDisplay":"OpenAI","description":"GPT-5 Chat is designed for advanced, natural, multimodal, and context-aware conversations for enterprise applications.","shortDescription":"GPT-5 Chat is designed for advanced, natural, multimodal, and context-aware conversations for enterprise applications.","categories":["text","multimodal"],"inputModalities":["file","image","text"],"outputModalities":["text"],"contextLength":128000,"supportsReasoning":false,"ranking":251,"createdAt":"2025-08-07T17:30:37.000Z","group":"openai/gpt-5-chat-2025-08-07","tier":"pro"},{"slug":"openai/gpt-5","name":"OpenAI: GPT-5","shortName":"GPT-5","author":"openai","authorDisplay":"OpenAI","description":"GPT-5 is OpenAI’s most advanced model, offering major improvements in reasoning, code quality, and user experience. It is optimized for complex tasks that require step-by-step reasoning, instruction following, and accuracy...","shortDescription":"GPT-5 is OpenAI’s most advanced model, offering major improvements in reasoning, code quality, and user experience.","categories":["text","multimodal","reasoning"],"inputModalities":["text","image","file"],"outputModalities":["text"],"contextLength":400000,"supportsReasoning":true,"ranking":252,"createdAt":"2025-08-07T17:23:33.000Z","group":"openai/gpt-5-2025-08-07","tier":"pro"},{"slug":"openai/gpt-5-mini","name":"OpenAI: GPT-5 Mini","shortName":"GPT-5 Mini","author":"openai","authorDisplay":"OpenAI","description":"GPT-5 Mini is a compact version of GPT-5, designed to handle lighter-weight reasoning tasks. It provides the same instruction-following and safety-tuning benefits as GPT-5, but with reduced latency and cost....","shortDescription":"GPT-5 Mini is a compact version of GPT-5, designed to handle lighter-weight reasoning tasks.","categories":["text","multimodal","reasoning"],"inputModalities":["text","image","file"],"outputModalities":["text"],"contextLength":400000,"supportsReasoning":true,"ranking":253,"createdAt":"2025-08-07T17:23:27.000Z","group":"openai/gpt-5-mini-2025-08-07","tier":"basic"},{"slug":"openai/gpt-5-nano","name":"OpenAI: GPT-5 Nano","shortName":"GPT-5 Nano","author":"openai","authorDisplay":"OpenAI","description":"GPT-5-Nano is the smallest and fastest variant in the GPT-5 system, optimized for developer tools, rapid interactions, and ultra-low latency environments. While limited in reasoning depth compared to its larger...","shortDescription":"GPT-5-Nano is the smallest and fastest variant in the GPT-5 system, optimized for developer tools, rapid interactions, and ultra-low latency environments.","categories":["text","multimodal","reasoning"],"inputModalities":["text","image","file"],"outputModalities":["text"],"contextLength":400000,"supportsReasoning":true,"ranking":254,"createdAt":"2025-08-07T17:23:22.000Z","group":"openai/gpt-5-nano-2025-08-07","tier":"basic"},{"slug":"openai/gpt-oss-120b","name":"OpenAI: gpt-oss-120b","shortName":"gpt-oss-120b","author":"openai","authorDisplay":"OpenAI","description":"gpt-oss-120b is an open-weight, 117B-parameter Mixture-of-Experts (MoE) language model from OpenAI designed for high-reasoning, agentic, and general-purpose production use cases. It activates 5.1B parameters per forward pass and is optimized...","shortDescription":"gpt-oss-120b is an open-weight, 117B-parameter Mixture-of-Experts (MoE) language model from OpenAI designed for high-reasoning, agentic, and general-purpose ...","categories":["text","reasoning"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":131072,"supportsReasoning":true,"ranking":255,"createdAt":"2025-08-05T17:17:11.000Z","group":"openai/gpt-oss-120b","tier":"basic"},{"slug":"openai/gpt-oss-20b","name":"OpenAI: gpt-oss-20b","shortName":"gpt-oss-20b","author":"openai","authorDisplay":"OpenAI","description":"gpt-oss-20b is an open-weight 21B parameter model released by OpenAI under the Apache 2.0 license. It uses a Mixture-of-Experts (MoE) architecture with 3.6B active parameters per forward pass, optimized for...","shortDescription":"gpt-oss-20b is an open-weight 21B parameter model released by OpenAI under the Apache 2.","categories":["text","reasoning"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":131072,"supportsReasoning":true,"ranking":256,"createdAt":"2025-08-05T17:17:09.000Z","group":"openai/gpt-oss-20b","tier":"basic"},{"slug":"openai/gpt-oss-20b:free","name":"OpenAI: gpt-oss-20b","shortName":"gpt-oss-20b","author":"openai","authorDisplay":"OpenAI","description":"gpt-oss-20b is an open-weight 21B parameter model released by OpenAI under the Apache 2.0 license. It uses a Mixture-of-Experts (MoE) architecture with 3.6B active parameters per forward pass, optimized for...","shortDescription":"gpt-oss-20b is an open-weight 21B parameter model released by OpenAI under the Apache 2.","categories":["text","reasoning"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":131072,"supportsReasoning":true,"ranking":257,"createdAt":"2025-08-05T17:17:09.000Z","group":"openai/gpt-oss-20b","tier":"basic"},{"slug":"mistralai/codestral-2508","name":"Mistral: Codestral 2508","shortName":"Codestral 2508","author":"mistralai","authorDisplay":"Mistral AI","description":"Mistral's cutting-edge language model for coding released end of July 2025. Codestral specializes in low-latency, high-frequency tasks such as fill-in-the-middle (FIM), code correction and test generation.\n\n[Blog Post](https://mistral.ai/news/codestral-25-08)","shortDescription":"Mistral's cutting-edge language model for coding released end of July 2025.","categories":["text","multimodal","coding"],"inputModalities":["text","file"],"outputModalities":["text"],"contextLength":256000,"supportsReasoning":false,"ranking":258,"createdAt":"2025-08-01T20:20:30.000Z","group":"mistralai/codestral-2508","tier":"basic"},{"slug":"qwen/qwen3-coder-30b-a3b-instruct","name":"Qwen: Qwen3 Coder 30B A3B Instruct","shortName":"Qwen3 Coder 30B A3B Instruct","author":"qwen","authorDisplay":"Qwen","description":"Qwen3-Coder-30B-A3B-Instruct is a 30.5B parameter Mixture-of-Experts (MoE) model with 128 experts (8 active per forward pass), designed for advanced code generation, repository-scale understanding, and agentic tool use. Built on the...","shortDescription":"Qwen3-Coder-30B-A3B-Instruct is a 30.","categories":["text","coding"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":262144,"supportsReasoning":false,"ranking":259,"createdAt":"2025-07-31T14:32:59.000Z","group":"qwen/qwen3-coder-30b-a3b-instruct","tier":"basic"},{"slug":"qwen/qwen3-30b-a3b-instruct-2507","name":"Qwen: Qwen3 30B A3B Instruct 2507","shortName":"Qwen3 30B A3B Instruct 2507","author":"qwen","authorDisplay":"Qwen","description":"Qwen3-30B-A3B-Instruct-2507 is a 30.5B-parameter mixture-of-experts language model from Qwen, with 3.3B active parameters per inference. It operates in non-thinking mode and is designed for high-quality instruction following, multilingual understanding, and...","shortDescription":"Qwen3-30B-A3B-Instruct-2507 is a 30.","categories":["text"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":262144,"supportsReasoning":false,"ranking":260,"createdAt":"2025-07-29T16:36:05.000Z","group":"qwen/qwen3-30b-a3b-instruct-2507","tier":"basic"},{"slug":"z-ai/glm-4.5","name":"Z.ai: GLM 4.5","shortName":"GLM 4.5","author":"z-ai","authorDisplay":"Z ai","description":"GLM-4.5 is our latest flagship foundation model, purpose-built for agent-based applications. It leverages a Mixture-of-Experts (MoE) architecture and supports a context length of up to 128k tokens. GLM-4.5 delivers significantly...","shortDescription":"GLM-4.","categories":["text","reasoning"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":131072,"supportsReasoning":true,"ranking":261,"createdAt":"2025-07-25T19:22:27.000Z","group":"z-ai/glm-4.5","tier":"pro"},{"slug":"z-ai/glm-4.5-air","name":"Z.ai: GLM 4.5 Air","shortName":"GLM 4.5 Air","author":"z-ai","authorDisplay":"Z ai","description":"GLM-4.5-Air is the lightweight variant of our latest flagship model family, also purpose-built for agent-centric applications. Like GLM-4.5, it adopts the Mixture-of-Experts (MoE) architecture but with a more compact parameter...","shortDescription":"GLM-4.","categories":["text","reasoning"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":131072,"supportsReasoning":true,"ranking":262,"createdAt":"2025-07-25T19:20:58.000Z","group":"z-ai/glm-4.5-air","tier":"basic"},{"slug":"qwen/qwen3-235b-a22b-thinking-2507","name":"Qwen: Qwen3 235B A22B Thinking 2507","shortName":"Qwen3 235B A22B Thinking 2507","author":"qwen","authorDisplay":"Qwen","description":"Qwen3-235B-A22B-Thinking-2507 is a high-performance, open-weight Mixture-of-Experts (MoE) language model optimized for complex reasoning tasks. It activates 22B of its 235B parameters per forward pass and natively supports up to 262,144...","shortDescription":"Qwen3-235B-A22B-Thinking-2507 is a high-performance, open-weight Mixture-of-Experts (MoE) language model optimized for complex reasoning tasks.","categories":["text","reasoning"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":262144,"supportsReasoning":true,"ranking":263,"createdAt":"2025-07-25T13:19:17.000Z","group":"qwen/qwen3-235b-a22b-thinking-2507","tier":"basic"},{"slug":"qwen/qwen3-coder","name":"Qwen: Qwen3 Coder 480B A35B","shortName":"Qwen3 Coder 480B A35B","author":"qwen","authorDisplay":"Qwen","description":"Qwen3-Coder-480B-A35B-Instruct is a Mixture-of-Experts (MoE) code generation model developed by the Qwen team. It is optimized for agentic coding tasks such as function calling, tool use, and long-context reasoning over...","shortDescription":"Qwen3-Coder-480B-A35B-Instruct is a Mixture-of-Experts (MoE) code generation model developed by the Qwen team.","categories":["text","coding"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":262144,"supportsReasoning":false,"ranking":264,"createdAt":"2025-07-23T00:29:06.000Z","group":"qwen/qwen3-coder-480b-a35b-07-25","tier":"basic"},{"slug":"bytedance/ui-tars-1.5-7b","name":"ByteDance: UI-TARS 7B","shortName":"UI-TARS 7B","author":"bytedance","authorDisplay":"ByteDance","description":"UI-TARS-1.5 is a multimodal vision-language agent optimized for GUI-based environments, including desktop interfaces, web browsers, mobile systems, and games. Built by ByteDance, it builds upon the UI-TARS framework with reinforcement...","shortDescription":"UI-TARS-1.","categories":["text","multimodal"],"inputModalities":["image","text"],"outputModalities":["text"],"contextLength":128000,"supportsReasoning":false,"ranking":265,"createdAt":"2025-07-22T17:24:16.000Z","group":"bytedance/ui-tars-1.5-7b","tier":"basic"},{"slug":"google/gemini-2.5-flash-lite","name":"Google: Gemini 2.5 Flash Lite","shortName":"Gemini 2.5 Flash Lite","author":"google","authorDisplay":"Google","description":"Gemini 2.5 Flash-Lite is a lightweight reasoning model in the Gemini 2.5 family, optimized for ultra-low latency and cost efficiency. It offers improved throughput, faster token generation, and better performance...","shortDescription":"Gemini 2.","categories":["text","multimodal","reasoning"],"inputModalities":["text","image","file","audio","video"],"outputModalities":["text"],"contextLength":1048576,"supportsReasoning":true,"ranking":266,"createdAt":"2025-07-22T16:04:36.000Z","group":"google/gemini-2.5-flash-lite","tier":"basic"},{"slug":"qwen/qwen3-235b-a22b-2507","name":"Qwen: Qwen3 235B A22B Instruct 2507","shortName":"Qwen3 235B A22B Instruct 2507","author":"qwen","authorDisplay":"Qwen","description":"Qwen3-235B-A22B-Instruct-2507 is a multilingual, instruction-tuned mixture-of-experts language model based on the Qwen3-235B architecture, with 22B active parameters per forward pass. It is optimized for general-purpose text generation, including instruction following,...","shortDescription":"Qwen3-235B-A22B-Instruct-2507 is a multilingual, instruction-tuned mixture-of-experts language model based on the Qwen3-235B architecture, with 22B active pa...","categories":["text"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":262144,"supportsReasoning":false,"ranking":267,"createdAt":"2025-07-21T17:39:15.000Z","group":"qwen/qwen3-235b-a22b-07-25","tier":"basic"},{"slug":"moonshotai/kimi-k2","name":"MoonshotAI: Kimi K2 0711","shortName":"Kimi K2 0711","author":"moonshotai","authorDisplay":"Moonshotai","description":"Kimi K2 Instruct is a large-scale Mixture-of-Experts (MoE) language model developed by Moonshot AI, featuring 1 trillion total parameters with 32 billion active per forward pass. It is optimized for...","shortDescription":"Kimi K2 Instruct is a large-scale Mixture-of-Experts (MoE) language model developed by Moonshot AI, featuring 1 trillion total parameters with 32 billion act...","categories":["text"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":131072,"supportsReasoning":false,"ranking":268,"createdAt":"2025-07-11T19:47:32.000Z","group":"moonshotai/kimi-k2","tier":"pro"},{"slug":"cognitivecomputations/dolphin-mistral-24b-venice-edition","name":"Venice: Uncensored","shortName":"Uncensored","author":"cognitivecomputations","authorDisplay":"Cognitivecomputations","description":"Venice Uncensored Dolphin Mistral 24B Venice Edition is a fine-tuned variant of Mistral-Small-24B-Instruct-2501, developed by dphn.ai in collaboration with Venice.ai. This model is designed as an “uncensored” instruct-tuned LLM, preserving...","shortDescription":"Venice Uncensored Dolphin Mistral 24B Venice Edition is a fine-tuned variant of Mistral-Small-24B-Instruct-2501, developed by dphn.","categories":["text"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":128000,"supportsReasoning":false,"ranking":269,"createdAt":"2025-07-09T21:02:46.000Z","group":"venice/uncensored","tier":"basic"},{"slug":"tencent/hunyuan-a13b-instruct","name":"Tencent: Hunyuan A13B Instruct","shortName":"Hunyuan A13B Instruct","author":"tencent","authorDisplay":"Tencent","description":"Hunyuan-A13B is a 13B active parameter Mixture-of-Experts (MoE) language model developed by Tencent, with a total parameter count of 80B and support for reasoning via Chain-of-Thought. It offers competitive benchmark...","shortDescription":"Hunyuan-A13B is a 13B active parameter Mixture-of-Experts (MoE) language model developed by Tencent, with a total parameter count of 80B and support for reas...","categories":["text","reasoning"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":131072,"supportsReasoning":true,"ranking":270,"createdAt":"2025-07-08T15:14:24.000Z","group":"tencent/hunyuan-a13b-instruct","tier":"basic"},{"slug":"morph/morph-v3-large","name":"Morph: Morph V3 Large","shortName":"Morph V3 Large","author":"morph","authorDisplay":"Morph","description":"Morph's high-accuracy apply model for complex code edits. ~4,500 tokens/sec with 98% accuracy for precise code transformations. The model requires the prompt to be in the following format: {instruction} {initial_code}...","shortDescription":"Morph's high-accuracy apply model for complex code edits.","categories":["text"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":262144,"supportsReasoning":false,"ranking":271,"createdAt":"2025-07-07T17:54:18.000Z","group":"morph/morph-v3-large","tier":"pro"},{"slug":"morph/morph-v3-fast","name":"Morph: Morph V3 Fast","shortName":"Morph V3 Fast","author":"morph","authorDisplay":"Morph","description":"Morph's fastest apply model for code edits. ~10,500 tokens/sec with 96% accuracy for rapid code transformations. The model requires the prompt to be in the following format: {instruction} {initial_code} {edit_snippet}...","shortDescription":"Morph's fastest apply model for code edits.","categories":["text"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":81920,"supportsReasoning":false,"ranking":272,"createdAt":"2025-07-07T17:40:02.000Z","group":"morph/morph-v3-fast","tier":"pro"},{"slug":"baidu/ernie-4.5-vl-424b-a47b","name":"Baidu: ERNIE 4.5 VL 424B A47B","shortName":"ERNIE 4.5 VL 424B A47B","author":"baidu","authorDisplay":"Baidu","description":"ERNIE-4.5-VL-424B-A47B is a multimodal Mixture-of-Experts (MoE) model from Baidu’s ERNIE 4.5 series, featuring 424B total parameters with 47B active per token. It is trained jointly on text and image data...","shortDescription":"ERNIE-4.","categories":["text","multimodal","reasoning"],"inputModalities":["image","text"],"outputModalities":["text"],"contextLength":123000,"supportsReasoning":true,"ranking":273,"createdAt":"2025-06-30T16:28:23.000Z","group":"baidu/ernie-4.5-vl-424b-a47b","tier":"pro"},{"slug":"mistralai/mistral-small-3.2-24b-instruct","name":"Mistral: Mistral Small 3.2 24B","shortName":"Mistral Small 3.2 24B","author":"mistralai","authorDisplay":"Mistral AI","description":"Mistral-Small-3.2-24B-Instruct-2506 is an updated 24B parameter model from Mistral optimized for instruction following, repetition reduction, and improved function calling. Compared to the 3.1 release, version 3.2 significantly improves accuracy on...","shortDescription":"Mistral-Small-3.","categories":["text","multimodal"],"inputModalities":["image","text"],"outputModalities":["text"],"contextLength":256000,"supportsReasoning":false,"ranking":274,"createdAt":"2025-06-20T18:10:16.000Z","group":"mistralai/mistral-small-3.2-24b-instruct-2506","tier":"basic"},{"slug":"minimax/minimax-m1","name":"MiniMax: MiniMax M1","shortName":"MiniMax M1","author":"minimax","authorDisplay":"Minimax","description":"MiniMax-M1 is a large-scale, open-weight reasoning model designed for extended context and high-efficiency inference. It leverages a hybrid Mixture-of-Experts (MoE) architecture paired with a custom \"lightning attention\" mechanism, allowing it...","shortDescription":"MiniMax-M1 is a large-scale, open-weight reasoning model designed for extended context and high-efficiency inference.","categories":["text","reasoning"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":1000000,"supportsReasoning":true,"ranking":275,"createdAt":"2025-06-17T22:46:54.000Z","group":"minimax/minimax-m1","tier":"pro"},{"slug":"google/gemini-2.5-flash","name":"Google: Gemini 2.5 Flash","shortName":"Gemini 2.5 Flash","author":"google","authorDisplay":"Google","description":"Gemini 2.5 Flash is Google's state-of-the-art workhorse model, specifically designed for advanced reasoning, coding, mathematics, and scientific tasks. It includes built-in \"thinking\" capabilities, enabling it to provide responses with greater...","shortDescription":"Gemini 2.","categories":["text","multimodal","reasoning"],"inputModalities":["file","image","text","audio","video"],"outputModalities":["text"],"contextLength":1048576,"supportsReasoning":true,"ranking":276,"createdAt":"2025-06-17T15:01:28.000Z","group":"google/gemini-2.5-flash","tier":"basic"},{"slug":"google/gemini-2.5-pro","name":"Google: Gemini 2.5 Pro","shortName":"Gemini 2.5 Pro","author":"google","authorDisplay":"Google","description":"Gemini 2.5 Pro is Google’s state-of-the-art AI model designed for advanced reasoning, coding, mathematics, and scientific tasks. It employs “thinking” capabilities, enabling it to reason through responses with enhanced accuracy...","shortDescription":"Gemini 2.","categories":["text","multimodal","reasoning"],"inputModalities":["text","image","file","audio","video"],"outputModalities":["text"],"contextLength":1048576,"supportsReasoning":true,"ranking":277,"createdAt":"2025-06-17T14:12:24.000Z","group":"google/gemini-2.5-pro","tier":"pro"},{"slug":"google/gemini-2.5-pro-preview","name":"Google: Gemini 2.5 Pro Preview 06-05","shortName":"Gemini 2.5 Pro Preview 06-05","author":"google","authorDisplay":"Google","description":"Gemini 2.5 Pro is Google’s state-of-the-art AI model designed for advanced reasoning, coding, mathematics, and scientific tasks. It employs “thinking” capabilities, enabling it to reason through responses with enhanced accuracy...","shortDescription":"Gemini 2.","categories":["text","multimodal","reasoning"],"inputModalities":["file","image","text","audio"],"outputModalities":["text"],"contextLength":1048576,"supportsReasoning":true,"ranking":278,"createdAt":"2025-06-05T15:27:37.000Z","group":"google/gemini-2.5-pro-preview-06-05","tier":"pro"},{"slug":"deepseek/deepseek-r1-0528","name":"DeepSeek: R1 0528","shortName":"R1 0528","author":"deepseek","authorDisplay":"DeepSeek","description":"May 28th update to the [original DeepSeek R1](/deepseek/deepseek-r1) Performance on par with [OpenAI o1](/openai/o1), but open-sourced and with fully open reasoning tokens. It's 671B parameters in size, with 37B active...","shortDescription":"May 28th update to the [original DeepSeek R1](/deepseek/deepseek-r1) Performance on par with [OpenAI o1](/openai/o1), but open-sourced and with fully open re...","categories":["text","reasoning"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":163840,"supportsReasoning":true,"ranking":279,"createdAt":"2025-05-28T17:59:30.000Z","group":"deepseek/deepseek-r1-0528","tier":"pro"},{"slug":"anthropic/claude-sonnet-4","name":"Anthropic: Claude Sonnet 4","shortName":"Claude Sonnet 4","author":"anthropic","authorDisplay":"Anthropic","description":"Claude Sonnet 4 significantly enhances the capabilities of its predecessor, Sonnet 3.7, excelling in both coding and reasoning tasks with improved precision and controllability. Achieving state-of-the-art performance on SWE-bench (72.7%),...","shortDescription":"Claude Sonnet 4 significantly enhances the capabilities of its predecessor, Sonnet 3.","categories":["text","multimodal","reasoning"],"inputModalities":["image","text","file"],"outputModalities":["text"],"contextLength":1000000,"supportsReasoning":true,"ranking":280,"createdAt":"2025-05-22T16:12:51.000Z","group":"anthropic/claude-4-sonnet-20250522","tier":"pro"},{"slug":"google/gemma-3n-e4b-it","name":"Google: Gemma 3n 4B","shortName":"Gemma 3n 4B","author":"google","authorDisplay":"Google","description":"Gemma 3n E4B-it is optimized for efficient execution on mobile and low-resource devices, such as phones, laptops, and tablets. It supports multimodal inputs—including text, visual data, and audio—enabling diverse tasks...","shortDescription":"Gemma 3n E4B-it is optimized for efficient execution on mobile and low-resource devices, such as phones, laptops, and tablets.","categories":["text"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":32768,"supportsReasoning":false,"ranking":281,"createdAt":"2025-05-20T21:33:44.000Z","group":"google/gemma-3n-e4b-it","tier":"basic"},{"slug":"mistralai/mistral-medium-3","name":"Mistral: Mistral Medium 3","shortName":"Mistral Medium 3","author":"mistralai","authorDisplay":"Mistral AI","description":"Mistral Medium 3 is a high-performance enterprise-grade language model designed to deliver frontier-level capabilities at significantly reduced operational cost. It balances state-of-the-art reasoning and multimodal performance with 8× lower cost...","shortDescription":"Mistral Medium 3 is a high-performance enterprise-grade language model designed to deliver frontier-level capabilities at significantly reduced operational cost.","categories":["text","multimodal"],"inputModalities":["text","image","file"],"outputModalities":["text"],"contextLength":131072,"supportsReasoning":false,"ranking":282,"createdAt":"2025-05-07T14:15:41.000Z","group":"mistralai/mistral-medium-3","tier":"pro"},{"slug":"google/gemini-2.5-pro-preview-05-06","name":"Google: Gemini 2.5 Pro Preview 05-06","shortName":"Gemini 2.5 Pro Preview 05-06","author":"google","authorDisplay":"Google","description":"Gemini 2.5 Pro is Google’s state-of-the-art AI model designed for advanced reasoning, coding, mathematics, and scientific tasks. It employs “thinking” capabilities, enabling it to reason through responses with enhanced accuracy...","shortDescription":"Gemini 2.","categories":["text","multimodal","reasoning"],"inputModalities":["text","image","file","audio","video"],"outputModalities":["text"],"contextLength":1048576,"supportsReasoning":true,"ranking":283,"createdAt":"2025-05-07T00:41:53.000Z","group":"google/gemini-2.5-pro-preview-03-25","tier":"pro"},{"slug":"arcee-ai/virtuoso-large","name":"Arcee AI: Virtuoso Large","shortName":"Virtuoso Large","author":"arcee-ai","authorDisplay":"Arcee ai","description":"Virtuoso‑Large is Arcee's top‑tier general‑purpose LLM at 72 B parameters, tuned to tackle cross‑domain reasoning, creative writing and enterprise QA. Unlike many 70 B peers, it retains the 128 k...","shortDescription":"Virtuoso‑Large is Arcee's top‑tier general‑purpose LLM at 72 B parameters, tuned to tackle cross‑domain reasoning, creative writing and enterprise QA.","categories":["text"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":131072,"supportsReasoning":false,"ranking":284,"createdAt":"2025-05-05T21:01:25.000Z","group":"arcee-ai/virtuoso-large","tier":"pro"},{"slug":"meta-llama/llama-guard-4-12b","name":"Meta: Llama Guard 4 12B","shortName":"Llama Guard 4 12B","author":"meta-llama","authorDisplay":"Meta","description":"Llama Guard 4 is a Llama 4 Scout-derived multimodal pretrained model, fine-tuned for content safety classification. Similar to previous versions, it can be used to classify content in both LLM...","shortDescription":"Llama Guard 4 is a Llama 4 Scout-derived multimodal pretrained model, fine-tuned for content safety classification.","categories":["text","multimodal"],"inputModalities":["image","text"],"outputModalities":["text"],"contextLength":1048576,"supportsReasoning":false,"ranking":285,"createdAt":"2025-04-30T01:06:33.000Z","group":"meta-llama/llama-guard-4-12b","tier":"basic"},{"slug":"qwen/qwen3-30b-a3b","name":"Qwen: Qwen3 30B A3B","shortName":"Qwen3 30B A3B","author":"qwen","authorDisplay":"Qwen","description":"Qwen3, the latest generation in the Qwen large language model series, features both dense and mixture-of-experts (MoE) architectures to excel in reasoning, multilingual support, and advanced agent tasks. Its unique...","shortDescription":"Qwen3, the latest generation in the Qwen large language model series, features both dense and mixture-of-experts (MoE) architectures to excel in reasoning, m...","categories":["text","reasoning"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":131072,"supportsReasoning":true,"ranking":286,"createdAt":"2025-04-28T22:16:44.000Z","group":"qwen/qwen3-30b-a3b-04-28","tier":"basic"},{"slug":"qwen/qwen3-8b","name":"Qwen: Qwen3 8B","shortName":"Qwen3 8B","author":"qwen","authorDisplay":"Qwen","description":"Qwen3-8B is a dense 8.2B parameter causal language model from the Qwen3 series, designed for both reasoning-heavy tasks and efficient dialogue. It supports seamless switching between \"thinking\" mode for math,...","shortDescription":"Qwen3-8B is a dense 8.","categories":["text","reasoning"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":131072,"supportsReasoning":true,"ranking":287,"createdAt":"2025-04-28T21:43:52.000Z","group":"qwen/qwen3-8b-04-28","tier":"basic"},{"slug":"qwen/qwen3-14b","name":"Qwen: Qwen3 14B","shortName":"Qwen3 14B","author":"qwen","authorDisplay":"Qwen","description":"Qwen3-14B is a dense 14.8B parameter causal language model from the Qwen3 series, designed for both complex reasoning and efficient dialogue. It supports seamless switching between a \"thinking\" mode for...","shortDescription":"Qwen3-14B is a dense 14.","categories":["text","reasoning"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":131072,"supportsReasoning":true,"ranking":288,"createdAt":"2025-04-28T21:41:18.000Z","group":"qwen/qwen3-14b-04-28","tier":"basic"},{"slug":"qwen/qwen3-32b","name":"Qwen: Qwen3 32B","shortName":"Qwen3 32B","author":"qwen","authorDisplay":"Qwen","description":"Qwen3-32B is a dense 32.8B parameter causal language model from the Qwen3 series, optimized for both complex reasoning and efficient dialogue. It supports seamless switching between a \"thinking\" mode for...","shortDescription":"Qwen3-32B is a dense 32.","categories":["text","reasoning"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":131072,"supportsReasoning":true,"ranking":289,"createdAt":"2025-04-28T21:32:25.000Z","group":"qwen/qwen3-32b-04-28","tier":"basic"},{"slug":"qwen/qwen3-235b-a22b","name":"Qwen: Qwen3 235B A22B","shortName":"Qwen3 235B A22B","author":"qwen","authorDisplay":"Qwen","description":"Qwen3-235B-A22B is a 235B parameter mixture-of-experts (MoE) model developed by Qwen, activating 22B parameters per forward pass. It supports seamless switching between a \"thinking\" mode for complex reasoning, math, and...","shortDescription":"Qwen3-235B-A22B is a 235B parameter mixture-of-experts (MoE) model developed by Qwen, activating 22B parameters per forward pass.","categories":["text","reasoning"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":131072,"supportsReasoning":true,"ranking":290,"createdAt":"2025-04-28T21:29:17.000Z","group":"qwen/qwen3-235b-a22b-04-28","tier":"pro"},{"slug":"openai/o4-mini-high","name":"OpenAI: o4 Mini High","shortName":"o4 Mini High","author":"openai","authorDisplay":"OpenAI","description":"OpenAI o4-mini-high is the same model as [o4-mini](/openai/o4-mini) with reasoning_effort set to high. OpenAI o4-mini is a compact reasoning model in the o-series, optimized for fast, cost-efficient performance while retaining...","shortDescription":"OpenAI o4-mini-high is the same model as [o4-mini](/openai/o4-mini) with reasoning_effort set to high.","categories":["text","multimodal","reasoning"],"inputModalities":["image","text","file"],"outputModalities":["text"],"contextLength":200000,"supportsReasoning":true,"ranking":291,"createdAt":"2025-04-16T17:23:32.000Z","group":"openai/o4-mini-high-2025-04-16","tier":"pro"},{"slug":"openai/o3","name":"OpenAI: o3","shortName":"o3","author":"openai","authorDisplay":"OpenAI","description":"o3 is a well-rounded and powerful model across domains. It sets a new standard for math, science, coding, and visual reasoning tasks. It also excels at technical writing and instruction-following....","shortDescription":"o3 is a well-rounded and powerful model across domains.","categories":["text","multimodal","reasoning"],"inputModalities":["image","text","file"],"outputModalities":["text"],"contextLength":200000,"supportsReasoning":true,"ranking":292,"createdAt":"2025-04-16T17:10:57.000Z","group":"openai/o3-2025-04-16","tier":"pro"},{"slug":"openai/o4-mini","name":"OpenAI: o4 Mini","shortName":"o4 Mini","author":"openai","authorDisplay":"OpenAI","description":"OpenAI o4-mini is a compact reasoning model in the o-series, optimized for fast, cost-efficient performance while retaining strong multimodal and agentic capabilities. It supports tool use and demonstrates competitive reasoning...","shortDescription":"OpenAI o4-mini is a compact reasoning model in the o-series, optimized for fast, cost-efficient performance while retaining strong multimodal and agentic cap...","categories":["text","multimodal","reasoning"],"inputModalities":["image","text","file"],"outputModalities":["text"],"contextLength":200000,"supportsReasoning":true,"ranking":293,"createdAt":"2025-04-16T16:29:02.000Z","group":"openai/o4-mini-2025-04-16","tier":"pro"},{"slug":"openai/gpt-4.1","name":"OpenAI: GPT-4.1","shortName":"GPT-4.1","author":"openai","authorDisplay":"OpenAI","description":"GPT-4.1 is a flagship large language model optimized for advanced instruction following, real-world software engineering, and long-context reasoning. It supports a 1 million token context window and outperforms GPT-4o and...","shortDescription":"GPT-4.","categories":["text","multimodal"],"inputModalities":["image","text","file"],"outputModalities":["text"],"contextLength":1047576,"supportsReasoning":false,"ranking":294,"createdAt":"2025-04-14T17:23:05.000Z","group":"openai/gpt-4.1-2025-04-14","tier":"pro"},{"slug":"openai/gpt-4.1-mini","name":"OpenAI: GPT-4.1 Mini","shortName":"GPT-4.1 Mini","author":"openai","authorDisplay":"OpenAI","description":"GPT-4.1 Mini is a mid-sized model delivering performance competitive with GPT-4o at substantially lower latency and cost. It retains a 1 million token context window and scores 45.1% on hard...","shortDescription":"GPT-4.","categories":["text","multimodal"],"inputModalities":["image","text","file"],"outputModalities":["text"],"contextLength":1047576,"supportsReasoning":false,"ranking":295,"createdAt":"2025-04-14T17:23:01.000Z","group":"openai/gpt-4.1-mini-2025-04-14","tier":"pro"},{"slug":"openai/gpt-4.1-nano","name":"OpenAI: GPT-4.1 Nano","shortName":"GPT-4.1 Nano","author":"openai","authorDisplay":"OpenAI","description":"For tasks that demand low latency, GPT‑4.1 nano is the fastest and cheapest model in the GPT-4.1 series. It delivers exceptional performance at a small size with its 1 million...","shortDescription":"For tasks that demand low latency, GPT‑4.","categories":["text","multimodal"],"inputModalities":["image","text","file"],"outputModalities":["text"],"contextLength":1047576,"supportsReasoning":false,"ranking":296,"createdAt":"2025-04-14T17:22:49.000Z","group":"openai/gpt-4.1-nano-2025-04-14","tier":"basic"},{"slug":"meta-llama/llama-4-maverick","name":"Meta: Llama 4 Maverick","shortName":"Llama 4 Maverick","author":"meta-llama","authorDisplay":"Meta","description":"Llama 4 Maverick 17B Instruct (128E) is a high-capacity multimodal language model from Meta, built on a mixture-of-experts (MoE) architecture with 128 experts and 17 billion active parameters per forward...","shortDescription":"Llama 4 Maverick 17B Instruct (128E) is a high-capacity multimodal language model from Meta, built on a mixture-of-experts (MoE) architecture with 128 expert...","categories":["text","multimodal"],"inputModalities":["text","image"],"outputModalities":["text"],"contextLength":1048576,"supportsReasoning":false,"ranking":297,"createdAt":"2025-04-05T19:37:02.000Z","group":"meta-llama/llama-4-maverick-17b-128e-instruct","tier":"basic"},{"slug":"meta-llama/llama-4-scout","name":"Meta: Llama 4 Scout","shortName":"Llama 4 Scout","author":"meta-llama","authorDisplay":"Meta","description":"Llama 4 Scout 17B Instruct (16E) is a mixture-of-experts (MoE) language model developed by Meta, activating 17 billion parameters out of a total of 109B. It supports native multimodal input...","shortDescription":"Llama 4 Scout 17B Instruct (16E) is a mixture-of-experts (MoE) language model developed by Meta, activating 17 billion parameters out of a total of 109B.","categories":["text","multimodal"],"inputModalities":["text","image"],"outputModalities":["text"],"contextLength":1310720,"supportsReasoning":false,"ranking":298,"createdAt":"2025-04-05T19:31:59.000Z","group":"meta-llama/llama-4-scout-17b-16e-instruct","tier":"basic"},{"slug":"deepseek/deepseek-chat-v3-0324","name":"DeepSeek: DeepSeek V3 0324","shortName":"DeepSeek V3 0324","author":"deepseek","authorDisplay":"DeepSeek","description":"DeepSeek V3, a 685B-parameter, mixture-of-experts model, is the latest iteration of the flagship chat model family from the DeepSeek team. It succeeds the [DeepSeek V3](/deepseek/deepseek-chat-v3) model and performs really well...","shortDescription":"DeepSeek V3, a 685B-parameter, mixture-of-experts model, is the latest iteration of the flagship chat model family from the DeepSeek team.","categories":["text"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":163840,"supportsReasoning":false,"ranking":299,"createdAt":"2025-03-24T13:59:15.000Z","group":"deepseek/deepseek-chat-v3-0324","tier":"basic"},{"slug":"mistralai/mistral-small-3.1-24b-instruct","name":"Mistral: Mistral Small 3.1 24B","shortName":"Mistral Small 3.1 24B","author":"mistralai","authorDisplay":"Mistral AI","description":"Mistral Small 3.1 24B Instruct is an upgraded variant of Mistral Small 3 (2501), featuring 24 billion parameters with advanced multimodal capabilities. It provides state-of-the-art performance in text-based reasoning and...","shortDescription":"Mistral Small 3.","categories":["text","multimodal"],"inputModalities":["text","image"],"outputModalities":["text"],"contextLength":128000,"supportsReasoning":false,"ranking":300,"createdAt":"2025-03-17T19:15:37.000Z","group":"mistralai/mistral-small-3.1-24b-instruct-2503","tier":"pro"},{"slug":"google/gemma-3-4b-it","name":"Google: Gemma 3 4B","shortName":"Gemma 3 4B","author":"google","authorDisplay":"Google","description":"Gemma 3 introduces multimodality, supporting vision-language input and text outputs. It handles context windows up to 128k tokens, understands over 140 languages, and offers improved math, reasoning, and chat capabilities,...","shortDescription":"Gemma 3 introduces multimodality, supporting vision-language input and text outputs.","categories":["text","multimodal"],"inputModalities":["text","image"],"outputModalities":["text"],"contextLength":131072,"supportsReasoning":false,"ranking":301,"createdAt":"2025-03-13T22:38:30.000Z","group":"google/gemma-3-4b-it","tier":"basic"},{"slug":"google/gemma-3-12b-it","name":"Google: Gemma 3 12B","shortName":"Gemma 3 12B","author":"google","authorDisplay":"Google","description":"Gemma 3 introduces multimodality, supporting vision-language input and text outputs. It handles context windows up to 128k tokens, understands over 140 languages, and offers improved math, reasoning, and chat capabilities,...","shortDescription":"Gemma 3 introduces multimodality, supporting vision-language input and text outputs.","categories":["text","multimodal"],"inputModalities":["text","image"],"outputModalities":["text"],"contextLength":131072,"supportsReasoning":false,"ranking":302,"createdAt":"2025-03-13T21:50:25.000Z","group":"google/gemma-3-12b-it","tier":"basic"},{"slug":"cohere/command-a","name":"Cohere: Command A","shortName":"Command A","author":"cohere","authorDisplay":"Cohere","description":"Command A is an open-weights 111B parameter model with a 256k context window focused on delivering great performance across agentic, multilingual, and coding use cases. Compared to other leading proprietary...","shortDescription":"Command A is an open-weights 111B parameter model with a 256k context window focused on delivering great performance across agentic, multilingual, and coding...","categories":["text"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":256000,"supportsReasoning":false,"ranking":303,"createdAt":"2025-03-13T19:32:22.000Z","group":"cohere/command-a-03-2025","tier":"pro"},{"slug":"openai/gpt-4o-mini-search-preview","name":"OpenAI: GPT-4o-mini Search Preview","shortName":"GPT-4o-mini Search Preview","author":"openai","authorDisplay":"OpenAI","description":"GPT-4o mini Search Preview is a specialized model for web search in Chat Completions. It is trained to understand and execute web search queries.","shortDescription":"GPT-4o mini Search Preview is a specialized model for web search in Chat Completions.","categories":["text"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":128000,"supportsReasoning":false,"ranking":304,"createdAt":"2025-03-12T22:22:02.000Z","group":"openai/gpt-4o-mini-search-preview-2025-03-11","tier":"basic"},{"slug":"openai/gpt-4o-search-preview","name":"OpenAI: GPT-4o Search Preview","shortName":"GPT-4o Search Preview","author":"openai","authorDisplay":"OpenAI","description":"GPT-4o Search Previewis a specialized model for web search in Chat Completions. It is trained to understand and execute web search queries.","shortDescription":"GPT-4o Search Previewis a specialized model for web search in Chat Completions.","categories":["text"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":128000,"supportsReasoning":false,"ranking":305,"createdAt":"2025-03-12T22:19:09.000Z","group":"openai/gpt-4o-search-preview-2025-03-11","tier":"pro"},{"slug":"rekaai/reka-flash-3","name":"Reka Flash 3","shortName":"Reka Flash 3","author":"rekaai","authorDisplay":"Rekaai","description":"Reka Flash 3 is a general-purpose, instruction-tuned large language model with 21 billion parameters, developed by Reka. It excels at general chat, coding tasks, instruction-following, and function calling. Featuring a...","shortDescription":"Reka Flash 3 is a general-purpose, instruction-tuned large language model with 21 billion parameters, developed by Reka.","categories":["text","reasoning"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":65536,"supportsReasoning":true,"ranking":306,"createdAt":"2025-03-12T20:53:33.000Z","group":"rekaai/reka-flash-3","tier":"basic"},{"slug":"google/gemma-3-27b-it","name":"Google: Gemma 3 27B","shortName":"Gemma 3 27B","author":"google","authorDisplay":"Google","description":"Gemma 3 introduces multimodality, supporting vision-language input and text outputs. It handles context windows up to 128k tokens, understands over 140 languages, and offers improved math, reasoning, and chat capabilities,...","shortDescription":"Gemma 3 introduces multimodality, supporting vision-language input and text outputs.","categories":["text","multimodal"],"inputModalities":["text","image"],"outputModalities":["text"],"contextLength":262144,"supportsReasoning":false,"ranking":307,"createdAt":"2025-03-12T05:12:39.000Z","group":"google/gemma-3-27b-it","tier":"basic"},{"slug":"thedrummer/skyfall-36b-v2","name":"TheDrummer: Skyfall 36B V2","shortName":"Skyfall 36B V2","author":"thedrummer","authorDisplay":"Thedrummer","description":"Skyfall 36B v2 is an enhanced iteration of Mistral Small 2501, specifically fine-tuned for improved creativity, nuanced writing, role-playing, and coherent storytelling.","shortDescription":"Skyfall 36B v2 is an enhanced iteration of Mistral Small 2501, specifically fine-tuned for improved creativity, nuanced writing, role-playing, and coherent s...","categories":["text"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":32768,"supportsReasoning":false,"ranking":308,"createdAt":"2025-03-10T19:56:06.000Z","group":"thedrummer/skyfall-36b-v2","tier":"pro"},{"slug":"perplexity/sonar-reasoning-pro","name":"Perplexity: Sonar Reasoning Pro","shortName":"Sonar Reasoning Pro","author":"perplexity","authorDisplay":"Perplexity","description":"Note: Sonar Pro pricing includes Perplexity search pricing. See [details here](https://docs.perplexity.ai/guides/pricing#detailed-pricing-breakdown-for-sonar-reasoning-pro-and-sonar-pro) Sonar Reasoning Pro is a premier reasoning model powered by DeepSeek R1 with Chain of Thought (CoT). Designed for...","shortDescription":"Note: Sonar Pro pricing includes Perplexity search pricing.","categories":["text","multimodal","reasoning"],"inputModalities":["text","image"],"outputModalities":["text"],"contextLength":128000,"supportsReasoning":true,"ranking":309,"createdAt":"2025-03-07T02:08:28.000Z","group":"perplexity/sonar-reasoning-pro","tier":"pro"},{"slug":"perplexity/sonar-pro","name":"Perplexity: Sonar Pro","shortName":"Sonar Pro","author":"perplexity","authorDisplay":"Perplexity","description":"Note: Sonar Pro pricing includes Perplexity search pricing. See [details here](https://docs.perplexity.ai/guides/pricing#detailed-pricing-breakdown-for-sonar-reasoning-pro-and-sonar-pro) For enterprises seeking more advanced capabilities, the Sonar Pro API can handle in-depth, multi-step queries with added extensibility, like...","shortDescription":"Note: Sonar Pro pricing includes Perplexity search pricing.","categories":["text","multimodal"],"inputModalities":["text","image"],"outputModalities":["text"],"contextLength":200000,"supportsReasoning":false,"ranking":310,"createdAt":"2025-03-07T01:53:43.000Z","group":"perplexity/sonar-pro","tier":"pro"},{"slug":"perplexity/sonar-deep-research","name":"Perplexity: Sonar Deep Research","shortName":"Sonar Deep Research","author":"perplexity","authorDisplay":"Perplexity","description":"Sonar Deep Research is a research-focused model designed for multi-step retrieval, synthesis, and reasoning across complex topics. It autonomously searches, reads, and evaluates sources, refining its approach as it gathers...","shortDescription":"Sonar Deep Research is a research-focused model designed for multi-step retrieval, synthesis, and reasoning across complex topics.","categories":["text","reasoning"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":128000,"supportsReasoning":true,"ranking":311,"createdAt":"2025-03-07T01:34:06.000Z","group":"perplexity/sonar-deep-research","tier":"pro"},{"slug":"mistralai/mistral-saba","name":"Mistral: Saba","shortName":"Saba","author":"mistralai","authorDisplay":"Mistral AI","description":"Mistral Saba is a 24B-parameter language model specifically designed for the Middle East and South Asia, delivering accurate and contextually relevant responses while maintaining efficient performance. Trained on curated regional...","shortDescription":"Mistral Saba is a 24B-parameter language model specifically designed for the Middle East and South Asia, delivering accurate and contextually relevant respon...","categories":["text","multimodal"],"inputModalities":["text","file"],"outputModalities":["text"],"contextLength":32768,"supportsReasoning":false,"ranking":312,"createdAt":"2025-02-17T14:40:39.000Z","group":"mistralai/mistral-saba-2502","tier":"basic"},{"slug":"openai/o3-mini-high","name":"OpenAI: o3 Mini High","shortName":"o3 Mini High","author":"openai","authorDisplay":"OpenAI","description":"OpenAI o3-mini-high is the same model as [o3-mini](/openai/o3-mini) with reasoning_effort set to high. o3-mini is a cost-efficient language model optimized for STEM reasoning tasks, particularly excelling in science, mathematics, and...","shortDescription":"OpenAI o3-mini-high is the same model as [o3-mini](/openai/o3-mini) with reasoning_effort set to high.","categories":["text","multimodal","reasoning"],"inputModalities":["text","file"],"outputModalities":["text"],"contextLength":200000,"supportsReasoning":true,"ranking":313,"createdAt":"2025-02-12T15:03:31.000Z","group":"openai/o3-mini-high-2025-01-31","tier":"pro"},{"slug":"aion-labs/aion-rp-llama-3.1-8b","name":"AionLabs: Aion-RP 1.0 (8B)","shortName":"Aion-RP 1.0 (8B)","author":"aion-labs","authorDisplay":"Aion labs","description":"Aion-RP-Llama-3.1-8B ranks the highest in the character evaluation portion of the RPBench-Auto benchmark, a roleplaying-specific variant of Arena-Hard-Auto, where LLMs evaluate each other’s responses. It is a fine-tuned base model...","shortDescription":"Aion-RP-Llama-3.","categories":["text"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":32768,"supportsReasoning":false,"ranking":314,"createdAt":"2025-02-04T19:18:38.000Z","group":"aion-labs/aion-rp-llama-3.1-8b","tier":"pro"},{"slug":"qwen/qwen2.5-vl-72b-instruct","name":"Qwen: Qwen2.5 VL 72B Instruct","shortName":"Qwen2.5 VL 72B Instruct","author":"qwen","authorDisplay":"Qwen","description":"Qwen2.5-VL is proficient in recognizing common objects such as flowers, birds, fish, and insects. It is also highly capable of analyzing texts, charts, icons, graphics, and layouts within images.","shortDescription":"Qwen2.","categories":["text","multimodal"],"inputModalities":["text","image"],"outputModalities":["text"],"contextLength":128000,"supportsReasoning":false,"ranking":315,"createdAt":"2025-02-01T11:45:11.000Z","group":"qwen/qwen2.5-vl-72b-instruct","tier":"pro"},{"slug":"qwen/qwen-plus","name":"Qwen: Qwen-Plus","shortName":"Qwen-Plus","author":"qwen","authorDisplay":"Qwen","description":"Qwen-Plus, based on the Qwen2.5 foundation model, is a 131K context model with a balanced performance, speed, and cost combination.","shortDescription":"Qwen-Plus, based on the Qwen2.","categories":["text"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":1000000,"supportsReasoning":false,"ranking":316,"createdAt":"2025-02-01T11:37:20.000Z","group":"qwen/qwen-plus-2025-01-25","tier":"basic"},{"slug":"openai/o3-mini","name":"OpenAI: o3 Mini","shortName":"o3 Mini","author":"openai","authorDisplay":"OpenAI","description":"OpenAI o3-mini is a cost-efficient language model optimized for STEM reasoning tasks, particularly excelling in science, mathematics, and coding. This model supports the `reasoning_effort` parameter, which can be set to...","shortDescription":"OpenAI o3-mini is a cost-efficient language model optimized for STEM reasoning tasks, particularly excelling in science, mathematics, and coding.","categories":["text","multimodal","reasoning"],"inputModalities":["text","file"],"outputModalities":["text"],"contextLength":200000,"supportsReasoning":true,"ranking":317,"createdAt":"2025-01-31T19:28:41.000Z","group":"openai/o3-mini-2025-01-31","tier":"pro"},{"slug":"mistralai/mistral-small-24b-instruct-2501","name":"Mistral: Mistral Small 3","shortName":"Mistral Small 3","author":"mistralai","authorDisplay":"Mistral AI","description":"Mistral Small 3 is a 24B-parameter language model optimized for low-latency performance across common AI tasks. Released under the Apache 2.0 license, it features both pre-trained and instruction-tuned versions designed...","shortDescription":"Mistral Small 3 is a 24B-parameter language model optimized for low-latency performance across common AI tasks.","categories":["text"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":32768,"supportsReasoning":false,"ranking":318,"createdAt":"2025-01-30T16:43:29.000Z","group":"mistralai/mistral-small-24b-instruct-2501","tier":"basic"},{"slug":"perplexity/sonar","name":"Perplexity: Sonar","shortName":"Sonar","author":"perplexity","authorDisplay":"Perplexity","description":"Sonar is lightweight, affordable, fast, and simple to use — now featuring citations and the ability to customize sources. It is designed for companies seeking to integrate lightweight question-and-answer features...","shortDescription":"Sonar is lightweight, affordable, fast, and simple to use — now featuring citations and the ability to customize sources.","categories":["text","multimodal"],"inputModalities":["text","image"],"outputModalities":["text"],"contextLength":127072,"supportsReasoning":false,"ranking":319,"createdAt":"2025-01-27T21:36:48.000Z","group":"perplexity/sonar","tier":"pro"},{"slug":"deepseek/deepseek-r1-distill-llama-70b","name":"DeepSeek: R1 Distill Llama 70B","shortName":"R1 Distill Llama 70B","author":"deepseek","authorDisplay":"DeepSeek","description":"DeepSeek R1 Distill Llama 70B is a distilled large language model based on [Llama-3.3-70B-Instruct](/meta-llama/llama-3.3-70b-instruct), using outputs from [DeepSeek R1](/deepseek/deepseek-r1). The model combines advanced distillation techniques to achieve high performance across...","shortDescription":"DeepSeek R1 Distill Llama 70B is a distilled large language model based on [Llama-3.","categories":["text","reasoning"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":8192,"supportsReasoning":true,"ranking":320,"createdAt":"2025-01-23T20:12:49.000Z","group":"deepseek/deepseek-r1-distill-llama-70b","tier":"pro"},{"slug":"deepseek/deepseek-r1","name":"DeepSeek: R1","shortName":"R1","author":"deepseek","authorDisplay":"DeepSeek","description":"DeepSeek R1 is here: Performance on par with [OpenAI o1](/openai/o1), but open-sourced and with fully open reasoning tokens. It's 671B parameters in size, with 37B active in an inference pass....","shortDescription":"DeepSeek R1 is here: Performance on par with [OpenAI o1](/openai/o1), but open-sourced and with fully open reasoning tokens.","categories":["text","reasoning"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":163840,"supportsReasoning":true,"ranking":321,"createdAt":"2025-01-20T13:51:35.000Z","group":"deepseek/deepseek-r1","tier":"pro"},{"slug":"minimax/minimax-01","name":"MiniMax: MiniMax-01","shortName":"MiniMax-01","author":"minimax","authorDisplay":"Minimax","description":"MiniMax-01 is a combines MiniMax-Text-01 for text generation and MiniMax-VL-01 for image understanding. It has 456 billion parameters, with 45.9 billion parameters activated per inference, and can handle a context...","shortDescription":"MiniMax-01 is a combines MiniMax-Text-01 for text generation and MiniMax-VL-01 for image understanding.","categories":["text","multimodal"],"inputModalities":["text","image"],"outputModalities":["text"],"contextLength":1000192,"supportsReasoning":false,"ranking":322,"createdAt":"2025-01-15T04:31:02.000Z","group":"minimax/minimax-01","tier":"basic"},{"slug":"microsoft/phi-4","name":"Microsoft: Phi 4","shortName":"Phi 4","author":"microsoft","authorDisplay":"Microsoft","description":"[Microsoft Research](/microsoft) Phi-4 is designed to perform well in complex reasoning tasks and can operate efficiently in situations with limited memory or where quick responses are needed. At 14 billion...","shortDescription":"[Microsoft Research](/microsoft) Phi-4 is designed to perform well in complex reasoning tasks and can operate efficiently in situations with limited memory o...","categories":["text"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":16384,"supportsReasoning":false,"ranking":323,"createdAt":"2025-01-10T06:17:52.000Z","group":"microsoft/phi-4","tier":"basic"},{"slug":"deepseek/deepseek-chat","name":"DeepSeek: DeepSeek V3","shortName":"DeepSeek V3","author":"deepseek","authorDisplay":"DeepSeek","description":"DeepSeek-V3 is the latest model from the DeepSeek team, building upon the instruction following and coding abilities of the previous versions. Pre-trained on nearly 15 trillion tokens, the reported evaluations...","shortDescription":"DeepSeek-V3 is the latest model from the DeepSeek team, building upon the instruction following and coding abilities of the previous versions.","categories":["text"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":163840,"supportsReasoning":false,"ranking":324,"createdAt":"2024-12-26T19:28:40.000Z","group":"deepseek/deepseek-chat-v3","tier":"basic"},{"slug":"sao10k/l3.3-euryale-70b","name":"Sao10K: Llama 3.3 Euryale 70B","shortName":"Llama 3.3 Euryale 70B","author":"sao10k","authorDisplay":"Sao10k","description":"Euryale L3.3 70B is a model focused on creative roleplay from [Sao10k](https://ko-fi.com/sao10k). It is the successor of [Euryale L3 70B v2.2](/models/sao10k/l3-euryale-70b).","shortDescription":"Euryale L3.","categories":["text"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":131072,"supportsReasoning":false,"ranking":325,"createdAt":"2024-12-18T15:32:08.000Z","group":"sao10k/l3.3-euryale-70b-v2.3","tier":"pro"},{"slug":"cohere/command-r7b-12-2024","name":"Cohere: Command R7B (12-2024)","shortName":"Command R7B (12-2024)","author":"cohere","authorDisplay":"Cohere","description":"Command R7B (12-2024) is a small, fast update of the Command R+ model, delivered in December 2024. It excels at RAG, tool use, agents, and similar tasks requiring complex reasoning...","shortDescription":"Command R7B (12-2024) is a small, fast update of the Command R+ model, delivered in December 2024.","categories":["text"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":128000,"supportsReasoning":false,"ranking":326,"createdAt":"2024-12-14T06:35:52.000Z","group":"cohere/command-r7b-12-2024","tier":"basic"},{"slug":"meta-llama/llama-3.3-70b-instruct","name":"Meta: Llama 3.3 70B Instruct","shortName":"Llama 3.3 70B Instruct","author":"meta-llama","authorDisplay":"Meta","description":"The Meta Llama 3.3 multilingual large language model (LLM) is a pretrained and instruction tuned generative model in 70B (text in/text out). The Llama 3.3 instruction tuned text only model...","shortDescription":"The Meta Llama 3.","categories":["text"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":131072,"supportsReasoning":false,"ranking":327,"createdAt":"2024-12-06T17:28:57.000Z","group":"meta-llama/llama-3.3-70b-instruct","tier":"basic"},{"slug":"amazon/nova-lite-v1","name":"Amazon: Nova Lite 1.0","shortName":"Nova Lite 1.0","author":"amazon","authorDisplay":"Amazon","description":"Amazon Nova Lite 1.0 is a very low-cost multimodal model from Amazon that focused on fast processing of image, video, and text inputs to generate text output. Amazon Nova Lite...","shortDescription":"Amazon Nova Lite 1.","categories":["text","multimodal"],"inputModalities":["text","image"],"outputModalities":["text"],"contextLength":300000,"supportsReasoning":false,"ranking":328,"createdAt":"2024-12-05T22:22:43.000Z","group":"amazon/nova-lite-v1","tier":"basic"},{"slug":"amazon/nova-micro-v1","name":"Amazon: Nova Micro 1.0","shortName":"Nova Micro 1.0","author":"amazon","authorDisplay":"Amazon","description":"Amazon Nova Micro 1.0 is a text-only model that delivers the lowest latency responses in the Amazon Nova family of models at a very low cost. With a context length...","shortDescription":"Amazon Nova Micro 1.","categories":["text"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":128000,"supportsReasoning":false,"ranking":329,"createdAt":"2024-12-05T22:20:37.000Z","group":"amazon/nova-micro-v1","tier":"basic"},{"slug":"amazon/nova-pro-v1","name":"Amazon: Nova Pro 1.0","shortName":"Nova Pro 1.0","author":"amazon","authorDisplay":"Amazon","description":"Amazon Nova Pro 1.0 is a capable multimodal model from Amazon focused on providing a combination of accuracy, speed, and cost for a wide range of tasks. As of December...","shortDescription":"Amazon Nova Pro 1.","categories":["text","multimodal"],"inputModalities":["text","image"],"outputModalities":["text"],"contextLength":300000,"supportsReasoning":false,"ranking":330,"createdAt":"2024-12-05T22:05:03.000Z","group":"amazon/nova-pro-v1","tier":"pro"},{"slug":"openai/gpt-4o-2024-11-20","name":"OpenAI: GPT-4o (2024-11-20)","shortName":"GPT-4o (2024-11-20)","author":"openai","authorDisplay":"OpenAI","description":"The 2024-11-20 version of GPT-4o offers a leveled-up creative writing ability with more natural, engaging, and tailored writing to improve relevance & readability. It’s also better at working with uploaded...","shortDescription":"The 2024-11-20 version of GPT-4o offers a leveled-up creative writing ability with more natural, engaging, and tailored writing to improve relevance & readab...","categories":["text","multimodal"],"inputModalities":["text","image","file"],"outputModalities":["text"],"contextLength":128000,"supportsReasoning":false,"ranking":331,"createdAt":"2024-11-20T18:33:14.000Z","group":"openai/gpt-4o-2024-11-20","tier":"pro"},{"slug":"mistralai/mistral-large-2407","name":"Mistral Large 2407","shortName":"Mistral Large 2407","author":"mistralai","authorDisplay":"Mistral AI","description":"This is Mistral AI's flagship model, Mistral Large 2 (version mistral-large-2407). It's a proprietary weights-available model and excels at reasoning, code, JSON, chat, and more. Read the launch announcement [here](https://mistral.ai/news/mistral-large-2407/)....","shortDescription":"This is Mistral AI's flagship model, Mistral Large 2 (version mistral-large-2407).","categories":["text","multimodal"],"inputModalities":["text","file"],"outputModalities":["text"],"contextLength":131072,"supportsReasoning":false,"ranking":332,"createdAt":"2024-11-19T01:06:55.000Z","group":"mistralai/mistral-large-2407","tier":"pro"},{"slug":"qwen/qwen-2.5-coder-32b-instruct","name":"Qwen2.5 Coder 32B Instruct","shortName":"Qwen2.5 Coder 32B Instruct","author":"qwen","authorDisplay":"Qwen","description":"Qwen2.5-Coder is the latest series of Code-Specific Qwen large language models (formerly known as CodeQwen). Qwen2.5-Coder brings the following improvements upon CodeQwen1.5: - Significantly improvements in **code generation**, **code reasoning**...","shortDescription":"Qwen2.","categories":["text","coding"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":32768,"supportsReasoning":false,"ranking":333,"createdAt":"2024-11-11T23:40:00.000Z","group":"qwen/qwen-2.5-coder-32b-instruct","tier":"pro"},{"slug":"thedrummer/unslopnemo-12b","name":"TheDrummer: UnslopNemo 12B","shortName":"UnslopNemo 12B","author":"thedrummer","authorDisplay":"Thedrummer","description":"UnslopNemo v4.1 is the latest addition from the creator of Rocinante, designed for adventure writing and role-play scenarios.","shortDescription":"UnslopNemo v4.","categories":["text"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":32768,"supportsReasoning":false,"ranking":334,"createdAt":"2024-11-08T22:04:08.000Z","group":"thedrummer/unslopnemo-12b","tier":"pro"},{"slug":"anthracite-org/magnum-v4-72b","name":"Magnum v4 72B","shortName":"Magnum v4 72B","author":"anthracite-org","authorDisplay":"Anthracite org","description":"This is a series of models designed to replicate the prose quality of the Claude 3 models, specifically Sonnet(https://openrouter.ai/anthropic/claude-3.5-sonnet) and Opus(https://openrouter.ai/anthropic/claude-3-opus).\n\nThe model is fine-tuned on top of [Qwen2.5 72B](https://openrouter.ai/qwen/qwen-2.5-72b-instruct).","shortDescription":"This is a series of models designed to replicate the prose quality of the Claude 3 models, specifically Sonnet(https://openrouter.","categories":["text"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":16384,"supportsReasoning":false,"ranking":335,"createdAt":"2024-10-22T00:00:00.000Z","group":"anthracite-org/magnum-v4-72b","tier":"pro"},{"slug":"qwen/qwen-2.5-7b-instruct","name":"Qwen: Qwen2.5 7B Instruct","shortName":"Qwen2.5 7B Instruct","author":"qwen","authorDisplay":"Qwen","description":"Qwen2.5 7B is the latest series of Qwen large language models. Qwen2.5 brings the following improvements upon Qwen2: - Significantly more knowledge and has greatly improved capabilities in coding and...","shortDescription":"Qwen2.","categories":["text"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":32768,"supportsReasoning":false,"ranking":336,"createdAt":"2024-10-16T00:00:00.000Z","group":"qwen/qwen-2.5-7b-instruct","tier":"basic"},{"slug":"inflection/inflection-3-pi","name":"Inflection: Inflection 3 Pi","shortName":"Inflection 3 Pi","author":"inflection","authorDisplay":"Inflection","description":"Inflection 3 Pi powers Inflection's [Pi](https://pi.ai) chatbot, including backstory, emotional intelligence, productivity, and safety. It has access to recent news, and excels in scenarios like customer support and roleplay. Pi...","shortDescription":"Inflection 3 Pi powers Inflection's [Pi](https://pi.","categories":["text"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":8000,"supportsReasoning":false,"ranking":337,"createdAt":"2024-10-11T00:00:00.000Z","group":"inflection/inflection-3-pi","tier":"pro"},{"slug":"inflection/inflection-3-productivity","name":"Inflection: Inflection 3 Productivity","shortName":"Inflection 3 Productivity","author":"inflection","authorDisplay":"Inflection","description":"Inflection 3 Productivity is optimized for following instructions. It is better for tasks requiring JSON output or precise adherence to provided guidelines. It has access to recent news. For emotional...","shortDescription":"Inflection 3 Productivity is optimized for following instructions.","categories":["text"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":8000,"supportsReasoning":false,"ranking":338,"createdAt":"2024-10-11T00:00:00.000Z","group":"inflection/inflection-3-productivity","tier":"pro"},{"slug":"thedrummer/rocinante-12b","name":"TheDrummer: Rocinante 12B","shortName":"Rocinante 12B","author":"thedrummer","authorDisplay":"Thedrummer","description":"Rocinante 12B is designed for engaging storytelling and rich prose. Early testers have reported: - Expanded vocabulary with unique and expressive word choices - Enhanced creativity for vivid narratives -...","shortDescription":"Rocinante 12B is designed for engaging storytelling and rich prose.","categories":["text"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":65536,"supportsReasoning":false,"ranking":339,"createdAt":"2024-09-30T00:00:00.000Z","group":"thedrummer/rocinante-12b","tier":"basic"},{"slug":"meta-llama/llama-3.2-1b-instruct","name":"Meta: Llama 3.2 1B Instruct","shortName":"Llama 3.2 1B Instruct","author":"meta-llama","authorDisplay":"Meta","description":"Llama 3.2 1B is a 1-billion-parameter language model focused on efficiently performing natural language tasks, such as summarization, dialogue, and multilingual text analysis. Its smaller size allows it to operate...","shortDescription":"Llama 3.","categories":["text"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":60000,"supportsReasoning":false,"ranking":340,"createdAt":"2024-09-25T00:00:00.000Z","group":"meta-llama/llama-3.2-1b-instruct","tier":"basic"},{"slug":"meta-llama/llama-3.2-3b-instruct","name":"Meta: Llama 3.2 3B Instruct","shortName":"Llama 3.2 3B Instruct","author":"meta-llama","authorDisplay":"Meta","description":"Llama 3.2 3B is a 3-billion-parameter multilingual large language model, optimized for advanced natural language processing tasks like dialogue generation, reasoning, and summarization. Designed with the latest transformer architecture, it...","shortDescription":"Llama 3.","categories":["text"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":131072,"supportsReasoning":false,"ranking":341,"createdAt":"2024-09-25T00:00:00.000Z","group":"meta-llama/llama-3.2-3b-instruct","tier":"basic"},{"slug":"qwen/qwen-2.5-72b-instruct","name":"Qwen2.5 72B Instruct","shortName":"Qwen2.5 72B Instruct","author":"qwen","authorDisplay":"Qwen","description":"Qwen2.5 72B is the latest series of Qwen large language models. Qwen2.5 brings the following improvements upon Qwen2: - Significantly more knowledge and has greatly improved capabilities in coding and...","shortDescription":"Qwen2.","categories":["text"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":32768,"supportsReasoning":false,"ranking":342,"createdAt":"2024-09-19T00:00:00.000Z","group":"qwen/qwen-2.5-72b-instruct","tier":"pro"},{"slug":"cohere/command-r-08-2024","name":"Cohere: Command R (08-2024)","shortName":"Command R (08-2024)","author":"cohere","authorDisplay":"Cohere","description":"command-r-08-2024 is an update of the [Command R](/models/cohere/command-r) with improved performance for multilingual retrieval-augmented generation (RAG) and tool use. More broadly, it is better at math, code and reasoning and...","shortDescription":"command-r-08-2024 is an update of the [Command R](/models/cohere/command-r) with improved performance for multilingual retrieval-augmented generation (RAG) a...","categories":["text"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":128000,"supportsReasoning":false,"ranking":343,"createdAt":"2024-08-30T00:00:00.000Z","group":"cohere/command-r-08-2024","tier":"basic"},{"slug":"cohere/command-r-plus-08-2024","name":"Cohere: Command R+ (08-2024)","shortName":"Command R+ (08-2024)","author":"cohere","authorDisplay":"Cohere","description":"command-r-plus-08-2024 is an update of the [Command R+](/models/cohere/command-r-plus) with roughly 50% higher throughput and 25% lower latencies as compared to the previous Command R+ version, while keeping the hardware footprint...","shortDescription":"command-r-plus-08-2024 is an update of the [Command R+](/models/cohere/command-r-plus) with roughly 50% higher throughput and 25% lower latencies as compared...","categories":["text"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":128000,"supportsReasoning":false,"ranking":344,"createdAt":"2024-08-30T00:00:00.000Z","group":"cohere/command-r-plus-08-2024","tier":"pro"},{"slug":"sao10k/l3.1-euryale-70b","name":"Sao10K: Llama 3.1 Euryale 70B v2.2","shortName":"Llama 3.1 Euryale 70B v2.2","author":"sao10k","authorDisplay":"Sao10k","description":"Euryale L3.1 70B v2.2 is a model focused on creative roleplay from [Sao10k](https://ko-fi.com/sao10k). It is the successor of [Euryale L3 70B v2.1](/models/sao10k/l3-euryale-70b).","shortDescription":"Euryale L3.","categories":["text"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":131072,"supportsReasoning":false,"ranking":345,"createdAt":"2024-08-28T00:00:00.000Z","group":"sao10k/l3.1-euryale-70b","tier":"pro"},{"slug":"nousresearch/hermes-3-llama-3.1-70b","name":"Nous: Hermes 3 70B Instruct","shortName":"Hermes 3 70B Instruct","author":"nousresearch","authorDisplay":"Nousresearch","description":"Hermes 3 is a generalist language model with many improvements over [Hermes 2](/models/nousresearch/nous-hermes-2-mistral-7b-dpo), including advanced agentic capabilities, much better roleplaying, reasoning, multi-turn conversation, long context coherence, and improvements across the...","shortDescription":"Hermes 3 is a generalist language model with many improvements over [Hermes 2](/models/nousresearch/nous-hermes-2-mistral-7b-dpo), including advanced agentic...","categories":["text"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":131072,"supportsReasoning":false,"ranking":346,"createdAt":"2024-08-18T00:00:00.000Z","group":"nousresearch/hermes-3-llama-3.1-70b","tier":"pro"},{"slug":"nousresearch/hermes-3-llama-3.1-405b","name":"Nous: Hermes 3 405B Instruct","shortName":"Hermes 3 405B Instruct","author":"nousresearch","authorDisplay":"Nousresearch","description":"Hermes 3 is a generalist language model with many improvements over Hermes 2, including advanced agentic capabilities, much better roleplaying, reasoning, multi-turn conversation, long context coherence, and improvements across the...","shortDescription":"Hermes 3 is a generalist language model with many improvements over Hermes 2, including advanced agentic capabilities, much better roleplaying, reasoning, mu...","categories":["text"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":131072,"supportsReasoning":false,"ranking":347,"createdAt":"2024-08-16T00:00:00.000Z","group":"nousresearch/hermes-3-llama-3.1-405b","tier":"pro"},{"slug":"sao10k/l3-lunaris-8b","name":"Sao10K: Llama 3 8B Lunaris","shortName":"Llama 3 8B Lunaris","author":"sao10k","authorDisplay":"Sao10k","description":"Lunaris 8B is a versatile generalist and roleplaying model based on Llama 3. It's a strategic merge of multiple models, designed to balance creativity with improved logic and general knowledge....","shortDescription":"Lunaris 8B is a versatile generalist and roleplaying model based on Llama 3.","categories":["text"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":8192,"supportsReasoning":false,"ranking":348,"createdAt":"2024-08-13T00:00:00.000Z","group":"sao10k/l3-lunaris-8b","tier":"basic"},{"slug":"openai/gpt-4o-2024-08-06","name":"OpenAI: GPT-4o (2024-08-06)","shortName":"GPT-4o (2024-08-06)","author":"openai","authorDisplay":"OpenAI","description":"The 2024-08-06 version of GPT-4o offers improved performance in structured outputs, with the ability to supply a JSON schema in the respone_format. Read more [here](https://openai.com/index/introducing-structured-outputs-in-the-api/). GPT-4o (\"o\" for \"omni\") is...","shortDescription":"The 2024-08-06 version of GPT-4o offers improved performance in structured outputs, with the ability to supply a JSON schema in the respone_format.","categories":["text","multimodal"],"inputModalities":["text","image","file"],"outputModalities":["text"],"contextLength":128000,"supportsReasoning":false,"ranking":349,"createdAt":"2024-08-06T00:00:00.000Z","group":"openai/gpt-4o-2024-08-06","tier":"pro"},{"slug":"meta-llama/llama-3.1-70b-instruct","name":"Meta: Llama 3.1 70B Instruct","shortName":"Llama 3.1 70B Instruct","author":"meta-llama","authorDisplay":"Meta","description":"Meta's latest class of model (Llama 3.1) launched with a variety of sizes & flavors. This 70B instruct-tuned version is optimized for high quality dialogue usecases. It has demonstrated strong...","shortDescription":"Meta's latest class of model (Llama 3.","categories":["text"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":131072,"supportsReasoning":false,"ranking":350,"createdAt":"2024-07-23T00:00:00.000Z","group":"meta-llama/llama-3.1-70b-instruct","tier":"pro"},{"slug":"meta-llama/llama-3.1-8b-instruct","name":"Meta: Llama 3.1 8B Instruct","shortName":"Llama 3.1 8B Instruct","author":"meta-llama","authorDisplay":"Meta","description":"Meta's latest class of model (Llama 3.1) launched with a variety of sizes & flavors. This 8B instruct-tuned version is fast and efficient. It has demonstrated strong performance compared to...","shortDescription":"Meta's latest class of model (Llama 3.","categories":["text"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":131072,"supportsReasoning":false,"ranking":351,"createdAt":"2024-07-23T00:00:00.000Z","group":"meta-llama/llama-3.1-8b-instruct","tier":"basic"},{"slug":"mistralai/mistral-nemo","name":"Mistral: Mistral Nemo","shortName":"Mistral Nemo","author":"mistralai","authorDisplay":"Mistral AI","description":"A 12B parameter model with a 128k token context length built by Mistral in collaboration with NVIDIA. The model is multilingual, supporting English, French, German, Spanish, Italian, Portuguese, Chinese, Japanese,...","shortDescription":"A 12B parameter model with a 128k token context length built by Mistral in collaboration with NVIDIA.","categories":["text"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":131072,"supportsReasoning":false,"ranking":352,"createdAt":"2024-07-19T00:00:00.000Z","group":"mistralai/mistral-nemo","tier":"basic"},{"slug":"openai/gpt-4o-mini","name":"OpenAI: GPT-4o-mini","shortName":"GPT-4o-mini","author":"openai","authorDisplay":"OpenAI","description":"GPT-4o mini is OpenAI's newest model after [GPT-4 Omni](/models/openai/gpt-4o), supporting both text and image inputs with text outputs. As their most advanced small model, it is many multiples more affordable...","shortDescription":"GPT-4o mini is OpenAI's newest model after [GPT-4 Omni](/models/openai/gpt-4o), supporting both text and image inputs with text outputs.","categories":["text","multimodal"],"inputModalities":["text","image","file"],"outputModalities":["text"],"contextLength":128000,"supportsReasoning":false,"ranking":353,"createdAt":"2024-07-18T00:00:00.000Z","group":"openai/gpt-4o-mini","tier":"basic"},{"slug":"openai/gpt-4o-mini-2024-07-18","name":"OpenAI: GPT-4o-mini (2024-07-18)","shortName":"GPT-4o-mini (2024-07-18)","author":"openai","authorDisplay":"OpenAI","description":"GPT-4o mini is OpenAI's newest model after [GPT-4 Omni](/models/openai/gpt-4o), supporting both text and image inputs with text outputs. As their most advanced small model, it is many multiples more affordable...","shortDescription":"GPT-4o mini is OpenAI's newest model after [GPT-4 Omni](/models/openai/gpt-4o), supporting both text and image inputs with text outputs.","categories":["text","multimodal"],"inputModalities":["text","image","file"],"outputModalities":["text"],"contextLength":128000,"supportsReasoning":false,"ranking":354,"createdAt":"2024-07-18T00:00:00.000Z","group":"openai/gpt-4o-mini-2024-07-18","tier":"basic"},{"slug":"google/gemma-2-27b-it","name":"Google: Gemma 2 27B","shortName":"Gemma 2 27B","author":"google","authorDisplay":"Google","description":"Gemma 2 27B by Google is an open model built from the same research and technology used to create the [Gemini models](/models?q=gemini). Gemma models are well-suited for a variety of...","shortDescription":"Gemma 2 27B by Google is an open model built from the same research and technology used to create the [Gemini models](/models.","categories":["text"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":8192,"supportsReasoning":false,"ranking":355,"createdAt":"2024-07-13T00:00:00.000Z","group":"google/gemma-2-27b-it","tier":"pro"},{"slug":"openai/gpt-4o","name":"OpenAI: GPT-4o","shortName":"GPT-4o","author":"openai","authorDisplay":"OpenAI","description":"GPT-4o (\"o\" for \"omni\") is OpenAI's latest AI model, supporting both text and image inputs with text outputs. It maintains the intelligence level of [GPT-4 Turbo](/models/openai/gpt-4-turbo) while being twice as...","shortDescription":"GPT-4o (\"o\" for \"omni\") is OpenAI's latest AI model, supporting both text and image inputs with text outputs.","categories":["text","multimodal"],"inputModalities":["text","image","file"],"outputModalities":["text"],"contextLength":128000,"supportsReasoning":false,"ranking":356,"createdAt":"2024-05-13T00:00:00.000Z","group":"openai/gpt-4o","tier":"pro"},{"slug":"mistralai/mixtral-8x22b-instruct","name":"Mistral: Mixtral 8x22B Instruct","shortName":"Mixtral 8x22B Instruct","author":"mistralai","authorDisplay":"Mistral AI","description":"Mistral's official instruct fine-tuned version of [Mixtral 8x22B](/models/mistralai/mixtral-8x22b). It uses 39B active parameters out of 141B, offering unparalleled cost efficiency for its size. Its strengths include: - strong math, coding,...","shortDescription":"Mistral's official instruct fine-tuned version of [Mixtral 8x22B](/models/mistralai/mixtral-8x22b).","categories":["text","multimodal"],"inputModalities":["text","file"],"outputModalities":["text"],"contextLength":65536,"supportsReasoning":false,"ranking":357,"createdAt":"2024-04-17T00:00:00.000Z","group":"mistralai/mixtral-8x22b-instruct","tier":"pro"},{"slug":"microsoft/wizardlm-2-8x22b","name":"WizardLM-2 8x22B","shortName":"WizardLM-2 8x22B","author":"microsoft","authorDisplay":"Microsoft","description":"WizardLM-2 8x22B is Microsoft AI's most advanced Wizard model. It demonstrates highly competitive performance compared to leading proprietary models, and it consistently outperforms all existing state-of-the-art opensource models. It is...","shortDescription":"WizardLM-2 8x22B is Microsoft AI's most advanced Wizard model.","categories":["text"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":65535,"supportsReasoning":false,"ranking":358,"createdAt":"2024-04-16T00:00:00.000Z","group":"microsoft/wizardlm-2-8x22b","tier":"pro"},{"slug":"mistralai/mistral-large","name":"Mistral Large","shortName":"Mistral Large","author":"mistralai","authorDisplay":"Mistral AI","description":"This is Mistral AI's flagship model, Mistral Large 2 (version `mistral-large-2407`). It's a proprietary weights-available model and excels at reasoning, code, JSON, chat, and more. Read the launch announcement [here](https://mistral.ai/news/mistral-large-2407/)....","shortDescription":"This is Mistral AI's flagship model, Mistral Large 2 (version `mistral-large-2407`).","categories":["text","multimodal"],"inputModalities":["text","file"],"outputModalities":["text"],"contextLength":128000,"supportsReasoning":false,"ranking":359,"createdAt":"2024-02-26T00:00:00.000Z","group":"mistralai/mistral-large","tier":"pro"},{"slug":"openrouter/auto","name":"Auto Router","shortName":"Auto Router","author":"openrouter","authorDisplay":"Openrouter","description":"Your prompt will be processed by a meta-model and routed to one of dozens of models (see below), optimizing for the best possible output. To see which model was used,...","shortDescription":"Your prompt will be processed by a meta-model and routed to one of dozens of models (see below), optimizing for the best possible output.","categories":["image","text","multimodal","reasoning"],"inputModalities":["text","image","audio","file","video"],"outputModalities":["text","image"],"contextLength":2000000,"supportsReasoning":true,"ranking":360,"createdAt":"2023-11-08T00:00:00.000Z","group":"openrouter/auto","tier":"basic"},{"slug":"mancer/weaver","name":"Mancer: Weaver (alpha)","shortName":"Weaver (alpha)","author":"mancer","authorDisplay":"Mancer","description":"An attempt to recreate Claude-style verbosity, but don't expect the same level of coherence or memory. Meant for use in roleplay/narrative situations.","shortDescription":"An attempt to recreate Claude-style verbosity, but don't expect the same level of coherence or memory.","categories":["text"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":8000,"supportsReasoning":false,"ranking":361,"createdAt":"2023-08-02T00:00:00.000Z","group":"mancer/weaver","tier":"pro"},{"slug":"undi95/remm-slerp-l2-13b","name":"ReMM SLERP 13B","shortName":"ReMM SLERP 13B","author":"undi95","authorDisplay":"Undi95","description":"A recreation trial of the original MythoMax-L2-B13 but with updated models. #merge","shortDescription":"A recreation trial of the original MythoMax-L2-B13 but with updated models.","categories":["text"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":6144,"supportsReasoning":false,"ranking":362,"createdAt":"2023-07-22T00:00:00.000Z","group":"undi95/remm-slerp-l2-13b","tier":"pro"},{"slug":"gryphe/mythomax-l2-13b","name":"MythoMax 13B","shortName":"MythoMax 13B","author":"gryphe","authorDisplay":"Gryphe","description":"One of the highest performing and most popular fine-tunes of Llama 2 13B, with rich descriptions and roleplay. #merge","shortDescription":"One of the highest performing and most popular fine-tunes of Llama 2 13B, with rich descriptions and roleplay.","categories":["text"],"inputModalities":["text"],"outputModalities":["text"],"contextLength":8192,"supportsReasoning":false,"ranking":363,"createdAt":"2023-07-02T00:00:00.000Z","group":"gryphe/mythomax-l2-13b","tier":"basic"}],"categories":[{"id":"text","label":"Text","count":319},{"id":"multimodal","label":"Multimodal","count":218},{"id":"reasoning","label":"Reasoning","count":202},{"id":"image","label":"Image","count":36},{"id":"coding","label":"Coding","count":19},{"id":"video","label":"Video","count":17}]}]]}]}],["$","section",null,{"aria-labelledby":"cta-heading","className":"bg-primary/10 py-20 md:py-32 dark:bg-muted/50","children":["$","div",null,{"className":"mx-auto max-w-5xl px-4 text-center sm:px-6 lg:px-8","children":[["$","h2",null,{"id":"cta-heading","className":"mb-6 font-bold text-3xl md:text-4xl","children":"Access all models in one platform"}],["$","p",null,{"className":"mx-auto mb-10 max-w-3xl text-muted-foreground text-xl md:text-2xl","children":"GPT-5, Claude, Gemini, Sora, FLUX, and 200+ more AI models - all in one subscription."}],["$","div",null,{"className":"flex flex-col justify-center gap-4 sm:flex-row","children":["$","$L8",null,{"href":"/login?utm_source=models&utm_campaign=models-index&utm_content=footer-cta","children":"Start 3-day free trial","data-slot":"button","className":"$9","ref":null}]}]]}]}]]}],["$","footer",null,{"className":"border-t border-border bg-background","children":["$","div",null,{"className":"container mx-auto max-w-7xl px-6 py-20 md:py-24","children":["$","nav",null,{"aria-label":"Footer navigation","className":"grid grid-cols-2 md:grid-cols-5 gap-8 md:gap-12","children":[["$","div",null,{"className":"col-span-2 md:col-span-1","children":["$","p",null,{"className":"text-sm text-muted-foreground","children":"© 2025 Writingmate"}]}],["$","div",null,{"children":[["$","h3",null,{"className":"font-semibold text-base text-foreground mb-4","children":"Company"}],["$","ul",null,{"className":"space-y-2","children":[["$","li",null,{"children":["$","$L8",null,{"href":"/about","className":"text-sm text-muted-foreground hover:text-foreground transition-colors","children":"About Us"}]}],["$","li",null,{"children":["$","$L8",null,{"href":"/team","className":"text-sm text-muted-foreground hover:text-foreground transition-colors","children":"The Team"}]}],["$","li",null,{"children":["$","$L8",null,{"href":"mailto:hello@writingmate.ai","className":"text-sm text-muted-foreground hover:text-foreground transition-colors","children":"Email Us"}]}]]}]]}],["$","div",null,{"children":[["$","h3",null,{"className":"font-semibold text-base text-foreground mb-4","children":"Resources"}],["$","ul",null,{"className":"space-y-2","children":[["$","li",null,{"children":["$","$L8",null,{"href":"https://writingmate.ai/docs","target":"_blank","rel":"noopener noreferrer","className":"text-sm text-muted-foreground hover:text-foreground transition-colors","children":"User Manual"}]}],["$","li",null,{"children":["$","$L8",null,{"href":"/blog","className":"text-sm text-muted-foreground hover:text-foreground transition-colors","children":"Blog"}]}],["$","li",null,{"children":["$","$L8",null,{"href":"/models","className":"text-sm text-muted-foreground hover:text-foreground transition-colors","children":"AI Models Directory"}]}],["$","li",null,{"children":["$","$L8",null,{"href":"/text-to-image","className":"text-sm text-muted-foreground hover:text-foreground transition-colors","children":"AI Image Generation"}]}],["$","li",null,{"children":["$","$L8",null,{"href":"/text-to-video","className":"text-sm text-muted-foreground hover:text-foreground transition-colors","children":"AI Video Generation"}]}],["$","li",null,{"children":["$","$L8",null,{"href":"/changelog","className":"text-sm text-muted-foreground hover:text-foreground transition-colors","children":"Changelog"}]}],["$","li",null,{"children":["$","$L8",null,{"href":"/docs/chat-ai-models/openai-compatible-api","className":"text-sm text-muted-foreground hover:text-foreground transition-colors","children":"OpenAI-Compatible API"}]}],["$","li",null,{"children":["$","$L8",null,{"href":"/free-tools","className":"text-sm text-muted-foreground hover:text-foreground transition-colors","children":"Free AI Tools"}]}],["$","li",null,{"children":["$","$L8",null,{"href":"https://aidictation.com/?utm_source=writingmate","target":"_blank","rel":"noopener noreferrer","className":"text-sm text-muted-foreground hover:text-foreground transition-colors","children":"AIDictation - AI Voice to Text"}]}],["$","li",null,{"children":["$","$L8",null,{"href":"https://aiformedical.com/?utm_source=writingmate","target":"_blank","rel":"noopener noreferrer","className":"text-sm text-muted-foreground hover:text-foreground transition-colors","children":"AI For Medical"}]}],["$","li",null,{"children":["$","$L8",null,{"href":"https://mentioned.to","target":"_blank","rel":"noopener","className":"text-sm text-muted-foreground hover:text-foreground transition-colors","children":"Reddit Marketing Tool"}]}]]}]]}],["$","div",null,{"children":[["$","h3",null,{"className":"font-semibold text-base text-foreground mb-4","children":"Legal"}],["$","ul",null,{"className":"space-y-2","children":[["$","li",null,{"children":["$","$L8",null,{"href":"https://writingmate.ai/docs/security-and-privacy/writingmate-terms-of-service","target":"_blank","rel":"noopener noreferrer","className":"text-sm text-muted-foreground hover:text-foreground transition-colors","children":"Terms of Service"}]}],["$","li",null,{"children":["$","$L8",null,{"href":"https://writingmate.ai/docs/subscription-and-billing/writingmate-refund-policy","target":"_blank","rel":"noopener noreferrer","className":"text-sm text-muted-foreground hover:text-foreground transition-colors","children":"Refund Policy"}]}],["$","li",null,{"children":["$","$L8",null,{"href":"https://writingmate.ai/docs/security-and-privacy/writingmate-privacy-policy","target":"_blank","rel":"noopener noreferrer","className":"text-sm text-muted-foreground hover:text-foreground transition-colors","children":"Privacy Policy"}]}]]}]]}],["$","div",null,{"children":[["$","h3",null,{"className":"font-semibold text-base text-foreground mb-4","children":"Social"}],["$","ul",null,{"className":"space-y-2","children":[["$","li",null,{"children":["$","$L8",null,{"href":"https://www.linkedin.com/company/writingmate/","target":"_blank","rel":"noopener noreferrer","className":"flex items-center gap-2 text-sm text-muted-foreground hover:text-foreground transition-colors","children":[["$","svg",null,{"ref":"$undefined","xmlns":"http://www.w3.org/2000/svg","width":24,"height":24,"viewBox":"0 0 24 24","fill":"none","stroke":"currentColor","strokeWidth":2,"strokeLinecap":"round","strokeLinejoin":"round","className":"lucide lucide-linkedin h-4 w-4","children":[["$","path","c2jq9f",{"d":"M16 8a6 6 0 0 1 6 6v7h-4v-7a2 2 0 0 0-2-2 2 2 0 0 0-2 2v7h-4v-7a6 6 0 0 1 6-6z"}],["$","rect","mk3on5",{"width":"4","height":"12","x":"2","y":"9"}],["$","circle","bt5ra8",{"cx":"4","cy":"4","r":"2"}],"$undefined"]}],"LinkedIn"]}]}],["$","li",null,{"children":["$","$L8",null,{"href":"https://x.com/writingmateai","target":"_blank","rel":"noopener noreferrer","className":"flex items-center gap-2 text-sm text-muted-foreground hover:text-foreground transition-colors","children":[["$","svg",null,{"width":"15","height":"15","viewBox":"0 0 15 15","fill":"none","xmlns":"http://www.w3.org/2000/svg","className":"h-4 w-4","ref":"$undefined","children":["$","path",null,{"d":"$a","fill":"currentColor","fillRule":"evenodd","clipRule":"evenodd"}]}],"X (Twitter)"]}]}],["$","li",null,{"children":["$","$L8",null,{"href":"https://www.youtube.com/@writingmate","target":"_blank","rel":"noopener noreferrer","className":"flex items-center gap-2 text-sm text-muted-foreground hover:text-foreground transition-colors","children":[["$","svg",null,{"ref":"$undefined","xmlns":"http://www.w3.org/2000/svg","width":24,"height":24,"viewBox":"0 0 24 24","fill":"none","stroke":"currentColor","strokeWidth":2,"strokeLinecap":"round","strokeLinejoin":"round","className":"lucide lucide-youtube h-4 w-4","children":[["$","path","1q2vi4",{"d":"M2.5 17a24.12 24.12 0 0 1 0-10 2 2 0 0 1 1.4-1.4 49.56 49.56 0 0 1 16.2 0A2 2 0 0 1 21.5 7a24.12 24.12 0 0 1 0 10 2 2 0 0 1-1.4 1.4 49.55 49.55 0 0 1-16.2 0A2 2 0 0 1 2.5 17"}],["$","path","1jp15x",{"d":"m10 15 5-3-5-3z"}],"$undefined"]}],"YouTube"]}]}],["$","li",null,{"children":["$","$L8",null,{"href":"https://discord.gg/PePZDQGH","target":"_blank","rel":"noopener noreferrer","className":"flex items-center gap-2 text-sm text-muted-foreground hover:text-foreground transition-colors","children":[["$","svg",null,{"width":"15","height":"15","viewBox":"0 0 15 15","fill":"none","xmlns":"http://www.w3.org/2000/svg","className":"h-4 w-4","ref":"$undefined","children":["$","path",null,{"fillRule":"evenodd","clipRule":"evenodd","d":"$b","fill":"currentColor"}]}],"Discord"]}]}]]}]]}]]}]}]}]]}],null,["$","$Lc",null,{"children":["$Ld","$Le",["$","$Lf",null,{"promise":"$@10"}]]}]]}],{},null,false]},null,false]},null,false],["$","$1","h",{"children":[null,["$","$1","TYyRLbc6oSvj0z5sXmikXv",{"children":[["$","$L11",null,{"children":"$L12"}],["$","meta",null,{"name":"next-size-adjust","content":""}]]}],["$","$L13",null,{"children":"$L14"}]]}],false]],"m":"$undefined","G":["$15","$undefined"],"s":false,"S":false}

AI Models Directory

AI Models

All Models

Access all models in one platform